diff --git a/results/hipManaged_HostToGPUWriteDst.json b/results/hipManaged_HostToGPUWriteDst.json deleted file mode 100644 index ce1d330..0000000 --- a/results/hipManaged_HostToGPUWriteDst.json +++ /dev/null @@ -1,25272 +0,0 @@ -{ - "context": { - "date": "2023-10-09T15:03:52-04:00", - "host_name": "frontier10485", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1796, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [1.86,2.42,2.52], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8637057530223122e+06, - "cpu_time": 2.0665387037037041e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1977718281749398e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8671588987725228e+06, - "cpu_time": 2.0667462645502645e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1937072429629453e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8739381494159470e+06, - "cpu_time": 2.0730184841269834e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1857711799488184e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8683880865210472e+06, - "cpu_time": 2.0676043571428584e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1922640320549160e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8635952986538764e+06, - "cpu_time": 2.0678864179894177e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1979020890204264e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8673572372771413e+06, - "cpu_time": 2.0683588455026455e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1934832744324091e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8671588987725228e+06, - "cpu_time": 2.0676043571428582e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1937072429629453e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2395728667930953e+03, - "cpu_time": 2.6654270785914614e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9731964261298881e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2703598337589469e-03, - "cpu_time": 1.2886676237960624e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2672597890753300e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8629308771286455e+06, - "cpu_time": 2.0684725782493372e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3973719586560363e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8679243958272925e+06, - "cpu_time": 2.0687235517241363e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3856164726473382e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8629113614470551e+06, - "cpu_time": 2.0689651167108782e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3974180251049055e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8678853422695454e+06, - "cpu_time": 2.0684756312997309e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3857081666728193e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8731127194518319e+06, - "cpu_time": 2.0736159946949594e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3734687800301714e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8669529392248741e+06, - "cpu_time": 2.0696505745358083e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3879166806222545e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8678853422695459e+06, - "cpu_time": 2.0687235517241366e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3857081666728193e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2505096827767875e+03, - "cpu_time": 2.2260922948151015e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9823362968964302e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2767096017650684e-03, - "cpu_time": 1.0755884699591768e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2749603111153027e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8738656192568664e+06, - "cpu_time": 2.0765487665782480e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7434231311087999e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8682567012211895e+06, - "cpu_time": 2.0702982281167121e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7696728127834722e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8639770245239132e+06, - "cpu_time": 2.0705536684350127e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7898079131016713e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8683870033160609e+06, - "cpu_time": 2.0705153740053021e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7690612121157218e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8637766974549852e+06, - "cpu_time": 2.0708473740053065e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7907526810334064e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8676526091546032e+06, - "cpu_time": 2.0717526822281168e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7725435500286128e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8682567012211897e+06, - "cpu_time": 2.0705536684350125e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7696728127834722e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1242687358012035e+03, - "cpu_time": 2.6882155114591037e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9351984989332330e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2082633117023096e-03, - "cpu_time": 1.2975561873379584e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2059719486110969e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8716086091184050e+06, - "cpu_time": 2.0755924350132644e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7507933998783488e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8754222987893478e+06, - "cpu_time": 2.0789770079575600e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7472331442978423e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8758420435732123e+06, - "cpu_time": 2.0796438010610035e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7468421774778873e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8709020005382809e+06, - "cpu_time": 2.0745898620689707e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7514546454369202e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8666112887415544e+06, - "cpu_time": 2.0747421405835503e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7554806508264378e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8720772481521603e+06, - "cpu_time": 2.0767090493368700e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7503608035834875e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8716086091184050e+06, - "cpu_time": 2.0755924350132649e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7507933998783488e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7696349326532609e+03, - "cpu_time": 2.4167600343725330e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5270188410992007e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0136107825540271e-03, - "cpu_time": 1.1637451260417282e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0150238932901080e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8714762595266015e+06, - "cpu_time": 2.0802470026525266e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5018344297125965e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8670684023033357e+06, - "cpu_time": 2.0805393554376618e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5101017144926541e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8677792800950140e+06, - "cpu_time": 2.0806227214854066e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5087657679051980e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8724116509633919e+06, - "cpu_time": 2.0805347294429706e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5000850355892874e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8767881089942197e+06, - "cpu_time": 2.0857709496021164e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4919232323525898e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8711047403765128e+06, - "cpu_time": 2.0815429517241367e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5025420360104658e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8714762595266018e+06, - "cpu_time": 2.0805393554376620e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5018344297125965e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9210149109476524e+03, - "cpu_time": 2.3678044375250279e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3345096340433694e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0955614222636443e-03, - "cpu_time": 1.1375236987369304e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0940532786289318e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8795514765673594e+06, - "cpu_time": 2.0964044601063889e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9735786241607964e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8749812780755593e+06, - "cpu_time": 2.0910561250000035e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9905764677570283e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8698948935049516e+06, - "cpu_time": 2.0903210771276567e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0095918468613595e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8767365901944591e+06, - "cpu_time": 2.0936844893617060e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9840381801486015e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8691617025708300e+06, - "cpu_time": 2.0894307340425544e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0123414052259162e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8740651881826320e+06, - "cpu_time": 2.0921793771276618e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9940253048307404e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8749812780755595e+06, - "cpu_time": 2.0910561250000033e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9905764677570283e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4584329782528384e+03, - "cpu_time": 2.8454657815994524e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6639566186502579e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3790170194540501e-03, - "cpu_time": 1.3600486711163229e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3791115218027175e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 375, - "real_time": 1.8738475006927426e+06, - "cpu_time": 2.1087236879999978e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3989612276510656e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 375, - "real_time": 1.8736764288429790e+06, - "cpu_time": 2.1088695066666692e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3990889566875616e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 375, - "real_time": 1.8735868667329974e+06, - "cpu_time": 2.1084762079999940e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3991558366178378e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 375, - "real_time": 1.8771964905317873e+06, - "cpu_time": 2.1088502693333263e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3964654276853979e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 375, - "real_time": 1.8735651510845248e+06, - "cpu_time": 2.1087042906666701e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3991720536019593e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8743744875770067e+06, - "cpu_time": 2.1087247925333316e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3985687004487643e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8736764288429793e+06, - "cpu_time": 2.1087236879999978e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3990889566875616e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5814608750967111e+03, - "cpu_time": 1.5724377969826753e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1786925370935374e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.4372727306006843e-04, - "cpu_time": 7.4568184646495097e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4278486764027090e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 369, - "real_time": 1.8973187801363778e+06, - "cpu_time": 2.1582894607045953e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7633100219580102e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 369, - "real_time": 1.8981521569639142e+06, - "cpu_time": 2.1593367371273790e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7620968007043034e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 369, - "real_time": 1.8947510162953963e+06, - "cpu_time": 2.1581336693766932e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7670548557091379e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 369, - "real_time": 1.8925626350814088e+06, - "cpu_time": 2.1556046937669232e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7702544173786235e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 369, - "real_time": 1.8920644174921794e+06, - "cpu_time": 2.1556611951219616e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7709838795811880e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8949698011938557e+06, - "cpu_time": 2.1574051512195105e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7667399950662529e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8947510162953965e+06, - "cpu_time": 2.1581336693766932e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7670548557091379e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7353546522690676e+03, - "cpu_time": 1.6827652833482593e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9932701694225497e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4434819227967426e-03, - "cpu_time": 7.7999502429900423e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4433124097470264e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 371, - "real_time": 1.9078648546704333e+06, - "cpu_time": 2.2344598086253395e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4960706332688963e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 371, - "real_time": 1.9041874813577386e+06, - "cpu_time": 2.2317536522911065e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5066846634887874e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 371, - "real_time": 1.9091664603377902e+06, - "cpu_time": 2.2345259973045839e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4923235966259050e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 371, - "real_time": 1.9045377028114451e+06, - "cpu_time": 2.2318096603773688e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5056720507664955e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 371, - "real_time": 1.9090931942294834e+06, - "cpu_time": 2.2340756091644266e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4925343779417169e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9069699386813785e+06, - "cpu_time": 2.2333249455525652e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4986570644183612e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9078648546704333e+06, - "cpu_time": 2.2340756091644270e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4960706332688963e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4388335438792383e+03, - "cpu_time": 1.4194177536187278e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0345950541591237e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2789050809923256e-03, - "cpu_time": 6.3556257518430134e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2793296566319383e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 361, - "real_time": 1.9505058756740533e+06, - "cpu_time": 2.4047546288088541e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0751836362837253e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 361, - "real_time": 1.9524946140958681e+06, - "cpu_time": 2.4068352326869760e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0740884942062273e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 361, - "real_time": 1.9507576737919217e+06, - "cpu_time": 2.4053017202216126e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0750448547120228e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 361, - "real_time": 1.9520128462166935e+06, - "cpu_time": 2.4054533324099649e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0743535853591378e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 361, - "real_time": 1.9510839104786557e+06, - "cpu_time": 2.4058945484764525e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0748650986955807e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9513709840514385e+06, - "cpu_time": 2.4056478925207723e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0747071338513389e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9510839104786557e+06, - "cpu_time": 2.4054533324099653e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0748650986955807e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4874977650948608e+02, - "cpu_time": 7.7881717766649945e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6737949942204356e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.3495049554714144e-04, - "cpu_time": 3.2374529127386609e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3489010605813548e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 350, - "real_time": 2.0102761516214479e+06, - "cpu_time": 2.7083918371428493e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0864317554665110e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 350, - "real_time": 2.0105623354070953e+06, - "cpu_time": 2.7083039885714301e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0861347724146760e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 350, - "real_time": 2.0124988344364932e+06, - "cpu_time": 2.7115545742857093e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0841274182275090e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 350, - "real_time": 2.0094999827311509e+06, - "cpu_time": 2.7088186114285812e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0872376392357264e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 350, - "real_time": 2.0083059365528501e+06, - "cpu_time": 2.7073485657142880e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0884786145677080e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0102286481498077e+06, - "cpu_time": 2.7088835154285715e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0864820399824262e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0102761516214483e+06, - "cpu_time": 2.7083918371428489e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0864317554665110e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5407078499262168e+03, - "cpu_time": 1.5868551833563915e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5987969861367641e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.6643413242780481e-04, - "cpu_time": 5.8579675881904273e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.6626443721999654e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 332, - "real_time": 2.1187884028978557e+06, - "cpu_time": 3.3496945873493967e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9591532540611162e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 332, - "real_time": 2.1158705524404543e+06, - "cpu_time": 3.3467632108433880e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9646130479601140e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 332, - "real_time": 2.1203076978864889e+06, - "cpu_time": 3.3508787951807156e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9563163442559390e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 332, - "real_time": 2.1142748914552424e+06, - "cpu_time": 3.3470243042168580e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9676051746640058e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 332, - "real_time": 2.1205144704330759e+06, - "cpu_time": 3.3506921807228960e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9559305616465716e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1179512030226234e+06, - "cpu_time": 3.3490106156626507e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9607236765175495e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1187884028978557e+06, - "cpu_time": 3.3496945873493967e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9591532540611162e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7689657398971035e+03, - "cpu_time": 1.9863178627779587e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1804194199929414e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3073793843528536e-03, - "cpu_time": 5.9310587236969278e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3079476992315215e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 216, - "real_time": 3.2404116333324322e+06, - "cpu_time": 5.5651034675926017e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1774952994926596e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 216, - "real_time": 3.2426983848886769e+06, - "cpu_time": 5.5695314537037127e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1738441287612896e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 216, - "real_time": 3.2435974334711554e+06, - "cpu_time": 5.5699233009259049e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1724100613946295e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 216, - "real_time": 3.2413723475420503e+06, - "cpu_time": 5.5656653101851996e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1759607354959545e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 216, - "real_time": 3.2426026968837338e+06, - "cpu_time": 5.5650260555555578e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1739968069858055e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2421364992236099e+06, - "cpu_time": 5.5670499175925953e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1747414064260674e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time_median", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2426026968837334e+06, - "cpu_time": 5.5656653101851996e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1739968069858055e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2476452584458166e+03, - "cpu_time": 2.4604967013991381e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9915694570865461e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8482194032996101e-04, - "cpu_time": 4.4197496660190733e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8486357107881503e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 108, - "real_time": 6.4752646075147726e+06, - "cpu_time": 1.0791743944444470e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1819398949440460e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 108, - "real_time": 6.4792202535533793e+06, - "cpu_time": 1.0790454768518558e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1787762549973269e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 108, - "real_time": 6.4819447601352027e+06, - "cpu_time": 1.0797768675926041e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1765994993299065e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 108, - "real_time": 6.4812114902047645e+06, - "cpu_time": 1.0805205685185134e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1771851683457251e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 108, - "real_time": 6.4907196124463724e+06, - "cpu_time": 1.0828757203703716e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1696012158123760e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4816721447708989e+06, - "cpu_time": 1.0802786055555584e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1768204066858768e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time_median", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4812114902047645e+06, - "cpu_time": 1.0797768675926041e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1771851683457251e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.6835617635047947e+03, - "cpu_time": 1.5648626933941498e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5368786241820492e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7686659191641152e-04, - "cpu_time": 1.4485732526280872e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7638323676878167e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 53, - "real_time": 1.3288090023089129e+07, - "cpu_time": 2.2032856528301824e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0503017275916195e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 53, - "real_time": 1.3273665681481361e+07, - "cpu_time": 2.1997827962264154e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0557898330697260e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 53, - "real_time": 1.3281047027909530e+07, - "cpu_time": 2.2037747773584943e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0529799238699856e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 53, - "real_time": 1.3270097731981637e+07, - "cpu_time": 2.2034948377358567e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0571491902628632e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 53, - "real_time": 1.3258061424460052e+07, - "cpu_time": 2.2023639037735753e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0617403141751604e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3274192377784345e+07, - "cpu_time": 2.2025403935849048e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0555921977938719e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time_median", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3273665681481361e+07, - "cpu_time": 2.2032856528301828e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0557898330697260e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1373015887496633e+04, - "cpu_time": 1.6298443272543740e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3323108805163093e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.5677648506364014e-04, - "cpu_time": 7.3998385319126974e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5693440274055657e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 28, - "real_time": 2.5632657908967562e+07, - "cpu_time": 4.2015903178571425e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2362001816847887e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 28, - "real_time": 2.5611840321549349e+07, - "cpu_time": 4.2012037000000238e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2404562231739197e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 28, - "real_time": 2.5645903311669827e+07, - "cpu_time": 4.2056258249999702e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2334958285102015e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 28, - "real_time": 2.5600480514445476e+07, - "cpu_time": 4.1998232499999747e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2427815924886847e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 28, - "real_time": 2.5637046367462192e+07, - "cpu_time": 4.2031203678571366e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2353038675447931e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5625585684818886e+07, - "cpu_time": 4.2022726921428502e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2376475386804771e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time_median", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5632657908967566e+07, - "cpu_time": 4.2015903178571433e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2362001816847887e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8797434350808478e+04, - "cpu_time": 2.2119109238842309e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8429009588903016e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.3354164786736782e-04, - "cpu_time": 5.2636063528669274e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3370743840820666e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 14, - "real_time": 5.0024046695658140e+07, - "cpu_time": 8.0855187642856866e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3661283668859797e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 14, - "real_time": 5.0035932234355383e+07, - "cpu_time": 8.0903674999999806e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3648536963939772e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 14, - "real_time": 5.0016686320304871e+07, - "cpu_time": 8.0859939999999359e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3669180377314482e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 14, - "real_time": 4.9957604812724248e+07, - "cpu_time": 8.0851532142857656e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3732651316307545e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 14, - "real_time": 5.0030336316142760e+07, - "cpu_time": 8.0852397285714313e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3654537579709759e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0012921275837086e+07, - "cpu_time": 8.0864546414285600e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3673237981226273e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time_median", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0024046695658140e+07, - "cpu_time": 8.0855187642856866e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3661283668859797e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1743698016587317e+04, - "cpu_time": 2.2118004374465865e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4092372274395926e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.3470993508878994e-04, - "cpu_time": 2.7351917935890973e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3518381891401244e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 9.8500934739907578e+07, - "cpu_time": 1.5723903466666734e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4504143886310463e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 9.8667867481708527e+07, - "cpu_time": 1.5737451211111084e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4411930216240606e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 9.8673563864496022e+07, - "cpu_time": 1.5737583888888827e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4408789038699436e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 9.8686150378651083e+07, - "cpu_time": 1.5749301011111230e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4401849696240864e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 9.8810971611075938e+07, - "cpu_time": 1.5758711333333349e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4333127510692444e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8667897615167841e+07, - "cpu_time": 1.5741390182222244e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4411968069636765e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time_median", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8673563864496022e+07, - "cpu_time": 1.5737583888888830e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4408789038699436e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1035402198929476e+05, - "cpu_time": 1.3213554336765135e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0878370677803131e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1184389721133623e-03, - "cpu_time": 8.3941470123064747e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1188415497099945e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.7548662051558495e+08, - "cpu_time": 2.8295565350000018e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1186534953224030e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.7585363611578941e+08, - "cpu_time": 2.8338289299999887e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1058835501871758e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.7552291974425316e+08, - "cpu_time": 2.8288711749999964e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1173881198222017e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.7636067420244217e+08, - "cpu_time": 2.8379837500000352e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0883290952237196e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.7532899603247643e+08, - "cpu_time": 2.8317925324999750e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1241542944848061e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7571056932210925e+08, - "cpu_time": 2.8324065844999993e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1108817110080614e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time_median", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7552291974425316e+08, - "cpu_time": 2.8317925324999750e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1173881198222017e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1050824298441241e+05, - "cpu_time": 3.6785460467934085e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4252171321563601e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3362751857680035e-03, - "cpu_time": 1.2987351699165664e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3322610378613499e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8653959957610201e+06, - "cpu_time": 2.0670536904761684e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1957804183711493e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8619631477959622e+06, - "cpu_time": 2.0679179074074042e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1998287156480541e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8666776288622590e+06, - "cpu_time": 2.0670429338624051e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1942728281886117e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8622311334222404e+06, - "cpu_time": 2.0680946666666551e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1995121478141872e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8667443865818088e+06, - "cpu_time": 2.0673297671958148e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1941943575361036e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8646024584846583e+06, - "cpu_time": 2.0674877931216892e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1967176935116211e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time_median", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8653959957610201e+06, - "cpu_time": 2.0673297671958145e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1957804183711493e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3512248370793013e+03, - "cpu_time": 4.9107302349539930e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7708531705019068e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2609791574500636e-03, - "cpu_time": 2.3752160720326706e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2613606102805529e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8699633056861805e+06, - "cpu_time": 2.0732202142857693e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3808346265885457e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8694025817413128e+06, - "cpu_time": 2.0728949708994767e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3821486500619408e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8668607600572552e+06, - "cpu_time": 2.0698006455026935e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3881151584913908e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8630634143529090e+06, - "cpu_time": 2.0708296931217324e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3970591322278194e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8670075489411366e+06, - "cpu_time": 2.0701158968253722e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3877701537125809e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8672595221557587e+06, - "cpu_time": 2.0713722841270089e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3871855442164559e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time_median", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8670075489411366e+06, - "cpu_time": 2.0708296931217327e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3877701537125809e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7263974476803055e+03, - "cpu_time": 1.5871659407034608e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4108920711892742e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4601063298007276e-03, - "cpu_time": 7.6623886148615740e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4612767129579538e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8637051782655697e+06, - "cpu_time": 2.0736394854111797e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7910900238242261e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8681291539351076e+06, - "cpu_time": 2.0729346604774226e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7702715658004880e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8715795572425316e+06, - "cpu_time": 2.0768844111405446e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7541028841644134e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8719916783281865e+06, - "cpu_time": 2.0772831697612451e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7521756585114766e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8659180500133911e+06, - "cpu_time": 2.0707349628646953e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7806642954562865e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8682647235569577e+06, - "cpu_time": 2.0742953379310179e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7696608855513781e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time_median", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8681291539351079e+06, - "cpu_time": 2.0736394854111797e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7702715658004880e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5774650009194761e+03, - "cpu_time": 2.7653343105076010e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6796134219130046e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9148597925182683e-03, - "cpu_time": 1.3331439645744235e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9152546989362881e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8646944900293739e+06, - "cpu_time": 2.0770412042440274e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7572851839919265e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8693527596785296e+06, - "cpu_time": 2.0765771458885854e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7529061773035858e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8652369172242223e+06, - "cpu_time": 2.0773277559681837e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7567741501044352e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8694970482482947e+06, - "cpu_time": 2.0763734217506472e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7527708872663576e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8745385391496564e+06, - "cpu_time": 2.0815745331564941e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7480568852355786e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8686639508660156e+06, - "cpu_time": 2.0777788122015879e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7535586567803767e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time_median", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8693527596785296e+06, - "cpu_time": 2.0770412042440276e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7529061773035858e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9743073372910030e+03, - "cpu_time": 2.1548862521036440e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7263320700245902e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1268175775795034e-03, - "cpu_time": 1.0371105140976745e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1250113622468302e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8769245327941936e+06, - "cpu_time": 2.0901369681697651e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4916694227676801e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8706382617038805e+06, - "cpu_time": 2.0833231989389537e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5034031614592440e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8656540789466354e+06, - "cpu_time": 2.0840197347479502e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5127626680398434e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8702893991639966e+06, - "cpu_time": 2.0836875994695188e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5040566464897916e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8666747537546849e+06, - "cpu_time": 2.0847538435013462e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5108419325958602e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8700362052726783e+06, - "cpu_time": 2.0851842689655074e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5045467662704840e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time_median", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8702893991639963e+06, - "cpu_time": 2.0840197347479505e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5040566464897916e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4265681566584908e+03, - "cpu_time": 2.8184320397755550e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2840839264217982e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3671029171400629e-03, - "cpu_time": 1.3516465099623180e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3638103523548259e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8687503875008454e+06, - "cpu_time": 2.0987034574467754e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0138848332380995e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8774252788948906e+06, - "cpu_time": 2.1029305585106602e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9814762522614449e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8732116552316856e+06, - "cpu_time": 2.0982608962765397e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9971804645742789e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8700831623139861e+06, - "cpu_time": 2.0988155292553273e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0088861629990488e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8781733905733686e+06, - "cpu_time": 2.1037253537234152e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9786953993628010e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8735287749029554e+06, - "cpu_time": 2.1004871590425437e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9960246224871352e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time_median", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8732116552316856e+06, - "cpu_time": 2.0988155292553273e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9971804645742789e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2296866092492983e+03, - "cpu_time": 2.6166910967421650e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5793189779537887e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2576042951186525e-03, - "cpu_time": 1.2457543886794911e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2574520004938602e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8811295734501092e+06, - "cpu_time": 2.1257958138297554e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3935456849961245e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8821163567020237e+06, - "cpu_time": 2.1264830824468075e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3928150566596591e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8807623416657231e+06, - "cpu_time": 2.1255781968085393e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3938177843768847e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8808742264267725e+06, - "cpu_time": 2.1253071781915152e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3937348724162868e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8815393867314807e+06, - "cpu_time": 2.1259181409574733e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3932421603747764e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8812843769952219e+06, - "cpu_time": 2.1258164824468186e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3934311117647463e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time_median", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8811295734501090e+06, - "cpu_time": 2.1257958138297554e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3935456849961245e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5270442127543367e+02, - "cpu_time": 4.3911504057555777e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0931033153342221e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9379100152748328e-04, - "cpu_time": 2.0656300494487450e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9374278217101149e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 372, - "real_time": 1.9019490625973421e+06, - "cpu_time": 2.1834389973118245e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7565827619169843e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 372, - "real_time": 1.8978019544456694e+06, - "cpu_time": 2.1812802419355218e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7626064920622325e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 372, - "real_time": 1.8955408784833746e+06, - "cpu_time": 2.1791155618279665e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7659018381048244e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 372, - "real_time": 1.8952828115327987e+06, - "cpu_time": 2.1788024999999399e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7662784509504694e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 372, - "real_time": 1.8956974467640663e+06, - "cpu_time": 2.1791814354838775e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7656733984368318e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8972544307646502e+06, - "cpu_time": 2.1803637473118259e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7634085882942688e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time_median", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8956974467640663e+06, - "cpu_time": 2.1791814354838775e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7656733984368318e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8101198024781929e+03, - "cpu_time": 1.9805584055061086e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0870843933053303e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4811507391476379e-03, - "cpu_time": 9.0836146397496392e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4790011186250631e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 372, - "real_time": 1.8924553179174601e+06, - "cpu_time": 2.2583985591397751e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5408230253694892e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 372, - "real_time": 1.8999830579325077e+06, - "cpu_time": 2.2634749112902619e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5188702637223625e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 372, - "real_time": 1.8923675725286605e+06, - "cpu_time": 2.2586013010752639e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5410799425126958e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 372, - "real_time": 1.8987959859171703e+06, - "cpu_time": 2.2616611559139681e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5223205008699727e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 372, - "real_time": 1.8920402925227447e+06, - "cpu_time": 2.2587787043010220e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5420384235152054e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8951284453637090e+06, - "cpu_time": 2.2601829263440585e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5330264311979449e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time_median", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8924553179174601e+06, - "cpu_time": 2.2587787043010225e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5408230253694892e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9154448670976649e+03, - "cpu_time": 2.2737453630389032e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1422302225383462e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0660577791845776e-03, - "cpu_time": 1.0060005924904416e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0643859861176265e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 361, - "real_time": 1.9445494260739568e+06, - "cpu_time": 2.4517262049861229e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0784770867121377e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 361, - "real_time": 1.9434303120410694e+06, - "cpu_time": 2.4512840443212888e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0790981220198660e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 361, - "real_time": 1.9417345914680129e+06, - "cpu_time": 2.4500562548476579e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0800405004962530e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 361, - "real_time": 1.9406903765055961e+06, - "cpu_time": 2.4489722520775483e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0806216310383980e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 361, - "real_time": 1.9415573025421549e+06, - "cpu_time": 2.4496631911356612e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0801391219585018e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9423924017261579e+06, - "cpu_time": 2.4503403894736553e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0796752924450314e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time_median", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9417345914680131e+06, - "cpu_time": 2.4500562548476579e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0800405004962530e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5618103833133946e+03, - "cpu_time": 1.1425956321379379e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6788451821656548e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.0406532785314185e-04, - "cpu_time": 4.6630077888214244e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0383845429226708e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 354, - "real_time": 1.9760276914421616e+06, - "cpu_time": 2.7870536610169755e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1225937359910562e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 354, - "real_time": 1.9739828132340254e+06, - "cpu_time": 2.7865640423729317e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1247925624683464e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 354, - "real_time": 1.9721504456053178e+06, - "cpu_time": 2.7861275706215044e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1267667531888676e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 354, - "real_time": 1.9741960635769186e+06, - "cpu_time": 2.7866133446327327e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1245630448683050e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 354, - "real_time": 1.9738019442732977e+06, - "cpu_time": 2.7867744406779720e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1249872674252701e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9740317916263442e+06, - "cpu_time": 2.7866266118644234e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1247406727883692e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time_median", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9739828132340256e+06, - "cpu_time": 2.7866133446327327e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1247925624683464e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3788847750292057e+03, - "cpu_time": 3.3814104250203224e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4840310418316727e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.9851193931035158e-04, - "cpu_time": 1.2134422353621148e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9845278571531672e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 348, - "real_time": 2.0250472693099242e+06, - "cpu_time": 3.5182854224137696e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1424257730332322e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 348, - "real_time": 2.0076711712292687e+06, - "cpu_time": 3.5100135201149266e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1782778575556149e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 348, - "real_time": 2.0270210676746252e+06, - "cpu_time": 3.5161627298850259e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1383921133209105e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 348, - "real_time": 2.0595760380410342e+06, - "cpu_time": 3.4209819712643903e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0729780523077092e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 348, - "real_time": 2.1280676090351208e+06, - "cpu_time": 3.3558140201148721e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9418897991701717e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0494766310579949e+06, - "cpu_time": 3.4642515327585973e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0947927190775280e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time_median", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0270210676746250e+06, - "cpu_time": 3.5100135201149271e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1383921133209105e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7768405757844077e+04, - "cpu_time": 7.3040300871213694e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3534440123291478e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3307611823407202e-02, - "cpu_time": 2.1084006221987989e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2842289351428478e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 217, - "real_time": 3.2330593952591517e+06, - "cpu_time": 5.5389429447004683e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1892693417886286e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 217, - "real_time": 3.2336360159059684e+06, - "cpu_time": 5.5407397327189604e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1883439934100075e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 217, - "real_time": 3.2328050487035294e+06, - "cpu_time": 5.5395317926267991e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1896776165727234e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 217, - "real_time": 3.2336462980076191e+06, - "cpu_time": 5.5407249539170228e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1883274959098415e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 217, - "real_time": 3.2388017768220557e+06, - "cpu_time": 5.5468687880184976e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1800687896565161e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2343897069396651e+06, - "cpu_time": 5.5413616423963513e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1871374474675436e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time_median", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2336360159059693e+06, - "cpu_time": 5.5407249539170237e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1883439934100075e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4933881847506741e+03, - "cpu_time": 3.1748718659660735e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9948505644541951e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.7089912183460525e-04, - "cpu_time": 5.7294074468547168e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7014550027097413e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 107, - "real_time": 6.4497282336875098e+06, - "cpu_time": 1.0729077588785185e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.2024567213145800e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 107, - "real_time": 6.4598218163597248e+06, - "cpu_time": 1.0763218383177523e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1943277932252293e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 107, - "real_time": 6.4698285901936414e+06, - "cpu_time": 1.0769785102803659e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1862938147787495e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 107, - "real_time": 6.4693455732314382e+06, - "cpu_time": 1.0761629336448690e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1866810359984465e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 107, - "real_time": 6.4616730941511756e+06, - "cpu_time": 1.0750865691588724e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1928396115198097e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4620794615246989e+06, - "cpu_time": 1.0754915220560756e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1925197953673630e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time_median", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4616730941511756e+06, - "cpu_time": 1.0761629336448690e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.1928396115198097e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2258783674999322e+03, - "cpu_time": 1.5961807230101176e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6137655908627426e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2729460255753453e-03, - "cpu_time": 1.4841406838415722e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2737102315456515e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 54, - "real_time": 1.3215825392830150e+07, - "cpu_time": 2.1883666537036631e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0779169673661013e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 54, - "real_time": 1.3218089231048469e+07, - "cpu_time": 2.1890109759259194e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0770472817179546e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 54, - "real_time": 1.3238667079282029e+07, - "cpu_time": 2.1900477888888970e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0691556482315826e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 54, - "real_time": 1.3229964714911249e+07, - "cpu_time": 2.1882920148148291e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0724900214104757e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 54, - "real_time": 1.3275241841458611e+07, - "cpu_time": 2.1925055870370246e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0551895627557497e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3235557651906101e+07, - "cpu_time": 2.1896446040740661e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0703598962963734e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time_median", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3229964714911249e+07, - "cpu_time": 2.1890109759259194e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0724900214104757e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4032749316137168e+04, - "cpu_time": 1.7472779541221302e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1918049511072636e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8157715714136248e-03, - "cpu_time": 7.9797331076976322e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8128505942588780e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 28, - "real_time": 2.5522057632250447e+07, - "cpu_time": 4.1826264464285754e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2588913454375410e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 28, - "real_time": 2.5580400734075479e+07, - "cpu_time": 4.1887044607142746e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2468970050656586e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 28, - "real_time": 2.5570555190954890e+07, - "cpu_time": 4.1876360607142866e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2489172408535357e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 28, - "real_time": 2.5561915843614511e+07, - "cpu_time": 4.1881215107143328e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2506912557388859e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 28, - "real_time": 2.5565904365586381e+07, - "cpu_time": 4.1861169249999978e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2498720984291515e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5560166753296342e+07, - "cpu_time": 4.1866410807142936e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2510537891049547e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time_median", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5565904365586385e+07, - "cpu_time": 4.1876360607142873e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2498720984291515e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2392064631524805e+04, - "cpu_time": 2.4408616749659683e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6043133185481634e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7605315128224011e-04, - "cpu_time": 5.8301192481241472e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7683606062107606e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 14, - "real_time": 4.9962869446192466e+07, - "cpu_time": 8.0656709428570896e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3726989457459335e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 14, - "real_time": 4.9967598968318529e+07, - "cpu_time": 8.0639374785714522e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3721904102336178e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 14, - "real_time": 4.9963975591318950e+07, - "cpu_time": 8.0544187499999762e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3725800003520870e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 14, - "real_time": 4.9962455938969336e+07, - "cpu_time": 8.0624483928571865e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3727434121313429e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 14, - "real_time": 4.9923163971730642e+07, - "cpu_time": 8.0566655428571358e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3769720234880056e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9956012783305988e+07, - "cpu_time": 8.0606282214285702e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3734369583901978e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time_median", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9962869446192473e+07, - "cpu_time": 8.0624483928571880e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3726989457459335e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8474431642528631e+04, - "cpu_time": 4.8464833414919281e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9881281207809520e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.6981397459931610e-04, - "cpu_time": 6.0125379912795375e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6999189460604854e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 8.2339207331339523e+07, - "cpu_time": 1.5326703777777576e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.5202341557599497e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 8.2411971357133657e+07, - "cpu_time": 1.5323738988888952e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.5144772435240135e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 8.2214141885439560e+07, - "cpu_time": 1.5308496722222269e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.5301528385237808e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 8.2228523161676198e+07, - "cpu_time": 1.5297504977777660e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.5290107539012270e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 8.2198532091246709e+07, - "cpu_time": 1.5303727777777630e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.5313929378207369e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2278475165367126e+07, - "cpu_time": 1.5312034448888820e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.5250535859059410e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time_median", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2228523161676198e+07, - "cpu_time": 1.5308496722222269e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.5290107539012270e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2917299090918968e+04, - "cpu_time": 1.2696527991905920e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3643544127642307e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1293026384381752e-03, - "cpu_time": 8.2918622174516443e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1286274228722308e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.7823755741119385e+08, - "cpu_time": 2.7692496224999982e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0242175644433842e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.7819091677665710e+08, - "cpu_time": 2.7695264149999589e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0257943750624418e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.7814448103308678e+08, - "cpu_time": 2.7687966725000024e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0273650790257931e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.7813486233353615e+08, - "cpu_time": 2.7695191499999791e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0276905370131721e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.7821199074387550e+08, - "cpu_time": 2.7701930899999636e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0250818113758183e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7818396165966988e+08, - "cpu_time": 2.7694569899999803e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0260298733841219e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time_median", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7819091677665710e+08, - "cpu_time": 2.7695191499999797e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0257943750624418e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3806310975324610e+04, - "cpu_time": 5.0733307397219120e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4814960775648379e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4584878777695132e-04, - "cpu_time": 1.8318864521243018e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4584944128941953e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8684413580054671e+06, - "cpu_time": 2.0710293984169727e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1922015280010812e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8732680107950969e+06, - "cpu_time": 2.0758636147757180e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1865531127398470e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8686072989277872e+06, - "cpu_time": 2.0708710554090417e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1920068504229314e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8741013784578014e+06, - "cpu_time": 2.0766786015830461e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1855808053300721e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8683835485832468e+06, - "cpu_time": 2.0706497440633727e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1922693566349931e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8705603189538799e+06, - "cpu_time": 2.0730184828496303e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1897223306257850e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time_median", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8686072989277872e+06, - "cpu_time": 2.0710293984169730e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1920068504229314e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8685061218371716e+03, - "cpu_time": 2.9862212638114916e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3559263104792972e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5335010011553103e-03, - "cpu_time": 1.4405183979385200e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5325807585476973e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8618566833278495e+06, - "cpu_time": 2.0706044550264676e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3999090119856941e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8619819571473205e+06, - "cpu_time": 2.0711497407407379e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3996129868791457e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8659908634651436e+06, - "cpu_time": 2.0703124523809687e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3901608311133217e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8717089861980332e+06, - "cpu_time": 2.0755895264550245e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3767487683222881e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8663298945828394e+06, - "cpu_time": 2.0704036031747458e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3893633294831133e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8655736769442372e+06, - "cpu_time": 2.0716119555555887e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3911589855567133e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time_median", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8659908634651434e+06, - "cpu_time": 2.0706044550264678e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3901608311133217e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0343655632064342e+03, - "cpu_time": 2.2471423009854007e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4856227340298410e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1625334946913611e-03, - "cpu_time": 1.0847312861653844e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1601638121574980e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8723346030614623e+06, - "cpu_time": 2.0782423597883661e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7505726664509922e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8676420867060577e+06, - "cpu_time": 2.0730528068781949e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7725587876937930e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8631218444887381e+06, - "cpu_time": 2.0733030634920653e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7938424684704170e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8629390051597347e+06, - "cpu_time": 2.0738852936509138e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7947055457111858e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8675459890339028e+06, - "cpu_time": 2.0731915343915755e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7730101942365449e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8667167056899793e+06, - "cpu_time": 2.0743350116402232e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7769379325125869e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time_median", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8675459890339028e+06, - "cpu_time": 2.0733030634920653e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7730101942365449e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8826170335066417e+03, - "cpu_time": 2.2071543939289559e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8242688305759482e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0799176552456799e-03, - "cpu_time": 1.0640298609161062e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0784798122113553e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8778815844094083e+06, - "cpu_time": 2.0857112891246832e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7449449567026615e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8712472752204773e+06, - "cpu_time": 2.0790776206896969e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7511314743872721e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8757884051750812e+06, - "cpu_time": 2.0839732811670778e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7468921286429171e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8756695726527574e+06, - "cpu_time": 2.0835638673740905e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7470028025062140e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8709098785090144e+06, - "cpu_time": 2.0786844986736437e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7514472704646699e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8742993431933478e+06, - "cpu_time": 2.0822021114058387e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7482837265407469e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time_median", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8756695726527576e+06, - "cpu_time": 2.0835638673740909e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7470028025062140e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0712731985992968e+03, - "cpu_time": 3.1401350076313875e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8654132807557184e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6386246998126770e-03, - "cpu_time": 1.5080836727762535e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6389864169389641e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8663469463524264e+06, - "cpu_time": 2.0859572499999108e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5114585810576662e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8718707806909424e+06, - "cpu_time": 2.0866228829786610e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5010963724648476e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8794384871766174e+06, - "cpu_time": 2.0935917872340295e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4869989333064750e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8726010131355540e+06, - "cpu_time": 2.0873962260637011e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4997310980978295e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8788699879688136e+06, - "cpu_time": 2.0932366542552323e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4880540122336447e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8738254430648710e+06, - "cpu_time": 2.0893609601063072e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4974677994320929e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time_median", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8726010131355538e+06, - "cpu_time": 2.0873962260637011e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4997310980978295e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4360266788412155e+03, - "cpu_time": 3.7370908479683521e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0151940466759299e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9010315229522814e-03, - "cpu_time": 1.7886286378100069e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9026544485721176e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8680988533618646e+06, - "cpu_time": 2.1000179441490700e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0163310557211921e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8686686347249867e+06, - "cpu_time": 2.0998503909573988e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0141916851560995e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8734967753574736e+06, - "cpu_time": 2.1006653031915454e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9961155911245555e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8687984443107431e+06, - "cpu_time": 2.0998204441488669e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0137044687204048e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8689810011447333e+06, - "cpu_time": 2.1004678297872599e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0130193896952212e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8696087417799602e+06, - "cpu_time": 2.1001643824468283e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0106724380834952e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time_median", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8687984443107429e+06, - "cpu_time": 2.1000179441490700e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0137044687204048e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1983522069536762e+03, - "cpu_time": 3.8122508429088157e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2311639289349594e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1758354343490798e-03, - "cpu_time": 1.8152154539766523e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1740905029625245e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 375, - "real_time": 1.8811526253897075e+06, - "cpu_time": 2.1280845493333801e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3935286082685244e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 375, - "real_time": 1.8811859068615984e+06, - "cpu_time": 2.1279340559999584e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3935039543079370e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 375, - "real_time": 1.8815233825395505e+06, - "cpu_time": 2.1285209946666630e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3932540112585586e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 375, - "real_time": 1.8802361295480903e+06, - "cpu_time": 2.1274917546666074e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3942078650674883e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 375, - "real_time": 1.8802199160757787e+06, - "cpu_time": 2.1275222933333376e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3942198875710389e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8808635920829452e+06, - "cpu_time": 2.1279107295999890e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3937428652947095e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time_median", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8811526253897075e+06, - "cpu_time": 2.1279340559999580e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3935286082685244e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9807577936227335e+02, - "cpu_time": 4.2708418410152888e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4320927336868757e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1797934835877165e-04, - "cpu_time": 2.0070587462182372e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1799931278928565e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 372, - "real_time": 1.8929786468800961e+06, - "cpu_time": 2.1791895456990390e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7696456104462820e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 372, - "real_time": 1.8961580156634052e+06, - "cpu_time": 2.1824858655914459e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7650016278657472e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 372, - "real_time": 1.8989455442429993e+06, - "cpu_time": 2.1820745806452739e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7609427852708834e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 372, - "real_time": 1.8977644664431941e+06, - "cpu_time": 2.1811381747311843e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7626610639550275e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 372, - "real_time": 1.8996152229906279e+06, - "cpu_time": 2.1837831370967850e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7599694593655437e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8970923792440644e+06, - "cpu_time": 2.1817342607527459e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7636441093806976e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time_median", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8977644664431941e+06, - "cpu_time": 2.1820745806452744e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7626610639550275e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6479469193376867e+03, - "cpu_time": 1.7109584290775390e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8609407674814179e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3957922915661153e-03, - "cpu_time": 7.8421944407070974e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3970470200472421e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 370, - "real_time": 1.8934762592244945e+06, - "cpu_time": 2.2667429999998873e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5378354753149235e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 370, - "real_time": 1.9015273652700204e+06, - "cpu_time": 2.2713653243243154e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5143881658053350e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 370, - "real_time": 1.8926610629785354e+06, - "cpu_time": 2.2660313972972143e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5402207004239082e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 370, - "real_time": 1.8987613451679717e+06, - "cpu_time": 2.2690271783784665e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5224212493500018e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 370, - "real_time": 1.8943688419263659e+06, - "cpu_time": 2.2668461135135596e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5352261755620563e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8961589749134774e+06, - "cpu_time": 2.2680026027026894e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5300183532912445e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time_median", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8943688419263656e+06, - "cpu_time": 2.2668461135135600e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5352261755620563e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8153922945630570e+03, - "cpu_time": 2.1890276938873253e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1116827849346234e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0121689927065081e-03, - "cpu_time": 9.6517865159358607e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0102696119859973e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 364, - "real_time": 1.9380520192258940e+06, - "cpu_time": 2.4586348901098287e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0820927298110681e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 364, - "real_time": 1.9394761820676851e+06, - "cpu_time": 2.4598195054945457e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0812981460613844e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 364, - "real_time": 1.9417583997102946e+06, - "cpu_time": 2.4602398543956289e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0800272579291480e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 364, - "real_time": 1.9399575180064498e+06, - "cpu_time": 2.4597001318681720e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0810298578883765e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 364, - "real_time": 1.9395650080776168e+06, - "cpu_time": 2.4595008324175589e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0812486259888623e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9397618254175882e+06, - "cpu_time": 2.4595790428571468e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0811393235357678e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time_median", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9395650080776170e+06, - "cpu_time": 2.4597001318681720e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0812486259888623e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3293203989917583e+03, - "cpu_time": 5.9302149968538220e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4074755969898414e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.8530083517113485e-04, - "cpu_time": 2.4110690868324534e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8515458051829684e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 356, - "real_time": 1.9685012625865219e+06, - "cpu_time": 2.8028409073033216e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1307093267945755e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 356, - "real_time": 1.9675826253578737e+06, - "cpu_time": 2.8028866657303418e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1317041256334124e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 356, - "real_time": 1.9675610267185722e+06, - "cpu_time": 2.8043120646067862e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1317275261317358e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 356, - "real_time": 1.9678302665811370e+06, - "cpu_time": 2.8026777612359794e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1314358617357216e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 356, - "real_time": 1.9684482288672433e+06, - "cpu_time": 2.8024048342697588e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1307667321348047e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9679846820222693e+06, - "cpu_time": 2.8030244466292374e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1312687144860501e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time_median", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9678302665811367e+06, - "cpu_time": 2.8028409073033216e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1314358617357216e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6008386923340839e+02, - "cpu_time": 7.4410021860781490e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9822938074746256e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3378427354456521e-04, - "cpu_time": 2.6546333532789150e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3377126373649664e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 350, - "real_time": 2.0003439698900494e+06, - "cpu_time": 3.5436564400000796e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1935827668983784e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 350, - "real_time": 1.9952031284836787e+06, - "cpu_time": 3.5391827885713871e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.2043879544110394e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 350, - "real_time": 2.0035233940663082e+06, - "cpu_time": 3.5427174200000470e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1869279015378308e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 350, - "real_time": 1.9930815320861128e+06, - "cpu_time": 3.5393054171428117e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.2088634433433523e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 350, - "real_time": 2.0013519413104015e+06, - "cpu_time": 3.5449319485714375e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1914706888122287e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9987007931673103e+06, - "cpu_time": 3.5419588028571522e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1970465510005665e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time_median", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0003439698900494e+06, - "cpu_time": 3.5427174200000474e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1935827668983784e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3816620416344040e+03, - "cpu_time": 2.6001816449037306e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2061155633502677e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1922551172308550e-03, - "cpu_time": 7.3410838172546528e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1934747331204965e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 188, - "real_time": 3.6646647036987101e+06, - "cpu_time": 6.7922210212765569e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5781039621624651e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 188, - "real_time": 3.7328053359933039e+06, - "cpu_time": 6.9686623297871947e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.4945327950072603e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 188, - "real_time": 3.6944860934299673e+06, - "cpu_time": 6.8745376702127447e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5411501290627413e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 188, - "real_time": 3.6548331932243989e+06, - "cpu_time": 6.7903147872340363e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5904190733253841e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 188, - "real_time": 3.6396076432132022e+06, - "cpu_time": 6.7505371702127177e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6096221473994789e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6772793939119168e+06, - "cpu_time": 6.8352545957446517e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5627656213914671e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time_median", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6646647036987096e+06, - "cpu_time": 6.7922210212765560e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5781039621624651e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6950385273715510e+04, - "cpu_time": 8.7162636133903579e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5602796613639385e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0048294218516647e-02, - "cpu_time": 1.2751922391913164e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9945516376824754e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 97, - "real_time": 7.3470689701972548e+06, - "cpu_time": 1.3861465773195552e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5670500897855501e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 97, - "real_time": 7.3321164134390578e+06, - "cpu_time": 1.3876749206185510e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5763637820176973e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 97, - "real_time": 7.3491820595083162e+06, - "cpu_time": 1.3844524814433115e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5657369389274454e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 97, - "real_time": 7.3406179051500624e+06, - "cpu_time": 1.3893467381443039e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5710636943054533e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 97, - "real_time": 7.3555111645039208e+06, - "cpu_time": 1.3916840824742381e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5618083161815195e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3448993025597231e+06, - "cpu_time": 1.3878609599999920e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5684045642435331e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time_median", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3470689701972548e+06, - "cpu_time": 1.3876749206185510e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5670500897855501e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9077732449482210e+03, - "cpu_time": 2.8024652916552215e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5425949392969357e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2127835764669818e-03, - "cpu_time": 2.0192694891102330e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2132452065822493e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49, - "real_time": 1.4383576886386288e+07, - "cpu_time": 2.6741641306122512e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6656589338022690e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49, - "real_time": 1.4381203002163341e+07, - "cpu_time": 2.6737716775509935e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6664290873235655e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49, - "real_time": 1.4367573780520838e+07, - "cpu_time": 2.6739785163265288e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6708557078011570e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49, - "real_time": 1.4399286492594650e+07, - "cpu_time": 2.6759380306122683e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6605687048808384e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49, - "real_time": 1.4362969587804103e+07, - "cpu_time": 2.6730821795917924e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6723529970420275e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4378921949893847e+07, - "cpu_time": 2.6741869069387667e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6671730861699715e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time_median", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4381203002163341e+07, - "cpu_time": 2.6739785163265284e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6664290873235655e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4360057771318190e+04, - "cpu_time": 1.0610392888311982e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6598611195785655e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.9868806725278902e-04, - "cpu_time": 3.9677080389485792e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9843332002983289e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 26, - "real_time": 2.7747236908628389e+07, - "cpu_time": 5.0242324346153460e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8371565227189569e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 26, - "real_time": 2.7716018474445894e+07, - "cpu_time": 5.0120845192308344e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8426049406680994e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 26, - "real_time": 2.7739046069865044e+07, - "cpu_time": 5.0101666499999128e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8385848475809898e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 26, - "real_time": 2.7760393630999785e+07, - "cpu_time": 5.0207765576922938e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8348640074800758e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 26, - "real_time": 2.7749735503815688e+07, - "cpu_time": 5.0214695538460761e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8367209835763874e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7742486117550962e+07, - "cpu_time": 5.0177459430768929e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8379862604049015e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time_median", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7747236908628393e+07, - "cpu_time": 5.0207765576922946e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8371565227189569e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6644614102662716e+04, - "cpu_time": 6.2173522922803983e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9038064429159188e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.9996836736750467e-04, - "cpu_time": 1.2390727555384967e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0020973326883594e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.3590418770909309e+07, - "cpu_time": 9.3624053399997815e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0090195627602720e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.3591524064540863e+07, - "cpu_time": 9.3503911999999911e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0089162546808748e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.3575059026479721e+07, - "cpu_time": 9.3443534800002232e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0104556276330843e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.3546115756034851e+07, - "cpu_time": 9.3356494299996480e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0131639281369591e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.3651123493909836e+07, - "cpu_time": 9.3570227499998286e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0033519993383036e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3590848222374924e+07, - "cpu_time": 9.3499644399998948e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0089814745098982e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time_median", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3590418770909309e+07, - "cpu_time": 9.3503911999999911e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0090195627602720e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8353754056867256e+04, - "cpu_time": 1.0502145499139026e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5833901852631122e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.1567730926218179e-04, - "cpu_time": 1.1232283894268096e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1539298028921690e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 9.4750837422907352e+07, - "cpu_time": 1.7327072874999771e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6661336891805019e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 9.4940037466585636e+07, - "cpu_time": 1.7331625912499505e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6548420068714733e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 9.4903376884758472e+07, - "cpu_time": 1.7318609975000498e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6570264370247269e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 9.5178016461431980e+07, - "cpu_time": 1.7377399937500116e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6407028845526609e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 9.5206435769796371e+07, - "cpu_time": 1.7377864049999657e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6390191236454086e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.4995740801095963e+07, - "cpu_time": 1.7346514549999911e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6515448282549553e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time_median", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.4940037466585636e+07, - "cpu_time": 1.7331625912499505e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6548420068714733e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9315046295135684e+05, - "cpu_time": 2.8788078567900800e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1491249973492004e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0332539261500074e-03, - "cpu_time": 1.6595886444462093e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0332936078010714e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.9021894410252571e+08, - "cpu_time": 3.0970684724999839e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6447680806243258e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8997678905725479e+08, - "cpu_time": 3.0744388075000018e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6519632178665676e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.8961442261934280e+08, - "cpu_time": 3.0771750399999577e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6627645153110113e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8953919038176537e+08, - "cpu_time": 3.0742986949999815e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6650121900241032e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8949230760335922e+08, - "cpu_time": 3.0709498850001180e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6664137852367640e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8976833075284961e+08, - "cpu_time": 3.0787861800000083e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6581843578125553e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time_median", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8961442261934280e+08, - "cpu_time": 3.0744388075000018e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6627645153110113e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1578832222947828e+05, - "cpu_time": 1.0455652535274522e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4077054440963455e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6640728248843296e-03, - "cpu_time": 3.3960307484797439e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6626721310532464e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8670792902373655e+06, - "cpu_time": 2.0685603749999690e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1938007782622166e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8627699108115034e+06, - "cpu_time": 2.0694891648935315e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1988759729405358e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8678640003890132e+06, - "cpu_time": 2.0688252606383476e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1928791384955980e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8630592680795980e+06, - "cpu_time": 2.0688544361701256e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1985344589826553e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8657218585584371e+06, - "cpu_time": 2.0669270957446946e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1953969082855699e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8652988656151835e+06, - "cpu_time": 2.0685312664893339e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1958974513933151e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time_median", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8657218585584369e+06, - "cpu_time": 2.0688252606383476e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1953969082855699e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3097705943831552e+03, - "cpu_time": 9.5951180775990247e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7194757768688733e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2382844577677814e-03, - "cpu_time": 4.6386139929533923e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2384347798861661e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8696124626095062e+06, - "cpu_time": 2.0728049074073674e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3816567143364241e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8704966945127428e+06, - "cpu_time": 2.0731026084656040e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3795853924959674e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8653411385630968e+06, - "cpu_time": 2.0676225634920604e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3916899866961781e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8609660735857985e+06, - "cpu_time": 2.0684620502645874e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4020146934840474e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8653491543008140e+06, - "cpu_time": 2.0678324285714678e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3916711148217153e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8663531047143913e+06, - "cpu_time": 2.0699649116402171e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3893235803668667e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time_median", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8653491543008140e+06, - "cpu_time": 2.0684620502645872e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3916711148217153e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8355197369979942e+03, - "cpu_time": 2.7478804795926508e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0248031396249517e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0550879291327587e-03, - "cpu_time": 1.3275009948913871e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0560806179777350e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8626591914056840e+06, - "cpu_time": 2.0713108862434549e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7960267104126364e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8685038509718929e+06, - "cpu_time": 2.0725636640211826e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7685128352708202e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8749948920606312e+06, - "cpu_time": 2.0791793068783721e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7381571381209902e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8733178530676505e+06, - "cpu_time": 2.0769698439154120e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7459797455997076e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8689673446782830e+06, - "cpu_time": 2.0725102539682805e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7663382919193171e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8696886264368284e+06, - "cpu_time": 2.0745067910053406e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7630029442646950e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time_median", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8689673446782832e+06, - "cpu_time": 2.0725636640211828e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7663382919193171e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8131236723243910e+03, - "cpu_time": 3.3865448499849563e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2578507197889685e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5742915714778848e-03, - "cpu_time": 1.6324578278887098e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5765719059431687e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8677341489084475e+06, - "cpu_time": 2.0785402739361571e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7544252761641946e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8726145788489101e+06, - "cpu_time": 2.0783888191490246e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7498528725618690e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8682298418656152e+06, - "cpu_time": 2.0785900212765888e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7539597787003476e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8729038936223160e+06, - "cpu_time": 2.0788642313830114e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7495825659598898e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8769345608930923e+06, - "cpu_time": 2.0828368191489324e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7458253837261204e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8716834048276762e+06, - "cpu_time": 2.0794440329787428e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7507291754224844e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time_median", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8726145788489103e+06, - "cpu_time": 2.0785900212765888e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7498528725618690e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7899550600108487e+03, - "cpu_time": 1.9043870735942025e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5435769779189926e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0248910954894029e-03, - "cpu_time": 9.1581549846582000e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0240577627112771e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8797907300625972e+06, - "cpu_time": 2.0919673563830149e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4863455251647957e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8728583699680227e+06, - "cpu_time": 2.0853926276596151e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4992501862871222e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8683745366867331e+06, - "cpu_time": 2.0854675531914933e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5076478892833628e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8736826393077092e+06, - "cpu_time": 2.0854255079786025e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4977107982499287e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8683728094982414e+06, - "cpu_time": 2.0857108563830254e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5076511318744756e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8726158171046611e+06, - "cpu_time": 2.0867927803191501e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4997211061719365e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time_median", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8728583699680227e+06, - "cpu_time": 2.0854675531914930e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4992501862871222e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7081814585897619e+03, - "cpu_time": 2.8953792890491959e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7876115771721496e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5142271124620223e-03, - "cpu_time": 1.3874781034111025e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5109462470237266e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8812494213597483e+06, - "cpu_time": 2.1059939707446336e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9672845350438684e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8709361679902165e+06, - "cpu_time": 2.0990629335107072e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0056906399323717e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8754710984060869e+06, - "cpu_time": 2.0996693404254797e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9887507256920472e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8794996233717687e+06, - "cpu_time": 2.1039775531914197e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9737710170359373e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8711566314797234e+06, - "cpu_time": 2.0988910159575311e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0048652151769549e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8756625885215090e+06, - "cpu_time": 2.1015189627659544e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9880724265762359e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time_median", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8754710984060869e+06, - "cpu_time": 2.0996693404254802e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9887507256920472e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7067745316853488e+03, - "cpu_time": 3.2569022944638891e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7532298977530014e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5093929795739350e-03, - "cpu_time": 1.5497848709284331e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5088891338408549e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 375, - "real_time": 1.8763221378127735e+06, - "cpu_time": 2.1236109786667232e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3971161706037375e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 375, - "real_time": 1.8760042761374887e+06, - "cpu_time": 2.1234445893333033e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3973528916454771e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 375, - "real_time": 1.8763899917636686e+06, - "cpu_time": 2.1231572213332583e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3970656481364191e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 375, - "real_time": 1.8765960197197271e+06, - "cpu_time": 2.1234133839999838e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3969122669201422e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 375, - "real_time": 1.8763144139666108e+06, - "cpu_time": 2.1234805493333321e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3971219218308732e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8763253678800543e+06, - "cpu_time": 2.1234213445333201e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3971137798273298e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time_median", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8763221378127735e+06, - "cpu_time": 2.1234445893333033e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3971161706037375e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1251999317121854e+02, - "cpu_time": 1.6570385158742909e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5824868087917826e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1326393428839688e-04, - "cpu_time": 7.8036255976247153e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1326828434741824e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 369, - "real_time": 1.8985204291050411e+06, - "cpu_time": 2.1833960867208987e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7615610133157659e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 369, - "real_time": 1.8951526401642719e+06, - "cpu_time": 2.1810286612465950e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7664684568866950e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 369, - "real_time": 1.8962279669934162e+06, - "cpu_time": 2.1799643631436876e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7648996277134877e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 369, - "real_time": 1.9024098803873521e+06, - "cpu_time": 2.1867526531166257e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7559150391568041e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 369, - "real_time": 1.8970071383705237e+06, - "cpu_time": 2.1807198672087826e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7637639806160605e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8978636110041211e+06, - "cpu_time": 2.1823723262873180e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7625216235377628e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time_median", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8970071383705239e+06, - "cpu_time": 2.1810286612465950e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7637639806160605e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8221540937959262e+03, - "cpu_time": 2.7644932541816129e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1032175677143905e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4870162836953186e-03, - "cpu_time": 1.2667376784806499e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4853159999738553e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 373, - "real_time": 1.8916318952118424e+06, - "cpu_time": 2.2629475201072870e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5432349319874990e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 373, - "real_time": 1.8976737290836780e+06, - "cpu_time": 2.2663356729222396e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5255863214501131e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 373, - "real_time": 1.8922821727073216e+06, - "cpu_time": 2.2644794798928574e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5413300147503042e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 373, - "real_time": 1.8982677927256960e+06, - "cpu_time": 2.2674526193029354e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5238570870675969e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 373, - "real_time": 1.8929380253419259e+06, - "cpu_time": 2.2645184557640627e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5394100914138126e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8945587230140928e+06, - "cpu_time": 2.2651467495978763e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5346836893338656e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time_median", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8929380253419261e+06, - "cpu_time": 2.2645184557640627e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5394100914138126e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1557932509370430e+03, - "cpu_time": 1.7611917923159622e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2143052929670177e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6657141383912481e-03, - "cpu_time": 7.7751774476802441e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6648296108997727e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 363, - "real_time": 1.9407968059921067e+06, - "cpu_time": 2.4588264104682789e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0805623718697159e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 363, - "real_time": 1.9426396794581255e+06, - "cpu_time": 2.4597346969697606e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0795373028646123e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 363, - "real_time": 1.9430901344349871e+06, - "cpu_time": 2.4596828650139044e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0792870401813920e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 363, - "real_time": 1.9432020874901807e+06, - "cpu_time": 2.4594154490357400e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0792248595763190e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 363, - "real_time": 1.9409730983962186e+06, - "cpu_time": 2.4591508787878877e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0804642278313022e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9421403611543239e+06, - "cpu_time": 2.4593620600551148e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0798151604646683e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time_median", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9426396794581257e+06, - "cpu_time": 2.4594154490357405e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0795373028646123e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1668647829772362e+03, - "cpu_time": 3.7952024922896987e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4888064184409135e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.0081382701078435e-04, - "cpu_time": 1.5431654224204173e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0091825490287028e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 356, - "real_time": 1.9738303623005245e+06, - "cpu_time": 2.8019953286516694e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1249566731314666e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 356, - "real_time": 1.9760834085205672e+06, - "cpu_time": 2.8026008764045541e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1225338879496720e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 356, - "real_time": 1.9750415908010527e+06, - "cpu_time": 2.8022730140449903e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1236535066073425e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 356, - "real_time": 1.9766600400973321e+06, - "cpu_time": 2.8064233033706443e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1219147020311441e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 356, - "real_time": 1.9719615906314775e+06, - "cpu_time": 2.8021695898876823e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1269704338697922e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9747153984701908e+06, - "cpu_time": 2.8030924224719079e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1240058407178838e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time_median", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9750415908010527e+06, - "cpu_time": 2.8022730140449903e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1236535066073425e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8792439054526342e+03, - "cpu_time": 1.8750366726268039e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0221609800211259e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.5165303663934640e-04, - "cpu_time": 6.6891717789786679e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5205057408771733e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 350, - "real_time": 1.9999032883372689e+06, - "cpu_time": 3.5363140914284936e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1945068288648782e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 350, - "real_time": 2.0029872123684201e+06, - "cpu_time": 3.5387059228569991e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1880487045551033e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 350, - "real_time": 1.9966365443542600e+06, - "cpu_time": 3.5362213457142389e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.2013695600833511e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 350, - "real_time": 2.0053163396992853e+06, - "cpu_time": 3.5380761999999774e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1831843853912568e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 350, - "real_time": 1.9996321996274805e+06, - "cpu_time": 3.5370156342857429e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1950754751612563e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0008951168773430e+06, - "cpu_time": 3.5372666388570904e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1924369908111687e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time_median", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9999032883372691e+06, - "cpu_time": 3.5370156342857429e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1945068288648782e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3405912108659563e+03, - "cpu_time": 1.0942937597584432e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9982924057572791e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6695483849645172e-03, - "cpu_time": 3.0936140005323866e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6692659713421771e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 193, - "real_time": 3.6235311613876587e+06, - "cpu_time": 6.6986900362694236e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6300736085225325e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 193, - "real_time": 3.6225562789742812e+06, - "cpu_time": 6.7116815129535394e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6313196284559679e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 193, - "real_time": 3.5965673775059879e+06, - "cpu_time": 6.6555278031087564e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6647856800708771e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 193, - "real_time": 3.6447673174673258e+06, - "cpu_time": 6.7583387046631398e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6030965871528234e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 193, - "real_time": 3.6350113769192151e+06, - "cpu_time": 6.7423268963730298e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6154507538898573e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6244867024508938e+06, - "cpu_time": 6.7133129906735765e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6289452516184120e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time_median", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6235311613876582e+06, - "cpu_time": 6.7116815129535394e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6300736085225325e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8070697392518072e+04, - "cpu_time": 4.0077244357433010e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3139263654731970e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.9857259457728427e-03, - "cpu_time": 5.9698161568081266e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9988199032256478e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 99, - "real_time": 7.2283375387390452e+06, - "cpu_time": 1.3609573505050896e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6420676704941807e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 99, - "real_time": 7.2289904805295393e+06, - "cpu_time": 1.3589767555555280e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6416483865036249e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 99, - "real_time": 7.2282680846524965e+06, - "cpu_time": 1.3653700262626568e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6421122746187067e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 99, - "real_time": 7.2317170120324148e+06, - "cpu_time": 1.3650137303030612e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6398983732591887e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 99, - "real_time": 7.2333864783021538e+06, - "cpu_time": 1.3597001131312931e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6388274842845144e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2301399188511316e+06, - "cpu_time": 1.3620035951515257e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6409108378320436e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time_median", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2289904805295393e+06, - "cpu_time": 1.3609573505050894e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6416483865036249e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2967867189982244e+03, - "cpu_time": 2.9981739138543089e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4740366936002644e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1766836392886622e-04, - "cpu_time": 2.2012966225105706e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1761797308927535e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49, - "real_time": 1.4320635179779967e+07, - "cpu_time": 2.6716827979591511e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6861653241997547e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49, - "real_time": 1.4323028830849394e+07, - "cpu_time": 2.6653343346938577e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6853821766705379e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49, - "real_time": 1.4295906949864358e+07, - "cpu_time": 2.6659620448979191e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6942711809296398e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49, - "real_time": 1.4315603376955403e+07, - "cpu_time": 2.6654741693877839e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6878124681792145e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49, - "real_time": 1.4320383665665071e+07, - "cpu_time": 2.6699676408163805e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6862476290284023e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4315111600622838e+07, - "cpu_time": 2.6676841975510191e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6879757558015108e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time_median", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4320383665665071e+07, - "cpu_time": 2.6659620448979191e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6862476290284023e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1068509224213660e+04, - "cpu_time": 2.9400173491959675e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6280083305747798e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.7320453608842820e-04, - "cpu_time": 1.1020859785033608e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7389656422284406e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 26, - "real_time": 2.7537315367506102e+07, - "cpu_time": 4.9884253153845310e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8740309724736738e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 26, - "real_time": 2.7598084595340949e+07, - "cpu_time": 4.9912863000000790e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8632986661204147e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 26, - "real_time": 2.7612626337661192e+07, - "cpu_time": 4.9890672115382656e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8607374886661482e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 26, - "real_time": 2.7461407634501275e+07, - "cpu_time": 4.9731827884615906e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8875035754312496e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 26, - "real_time": 2.7600921618823823e+07, - "cpu_time": 4.9920327769231014e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8627987809096756e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7562071110766672e+07, - "cpu_time": 4.9867988784615144e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8696738967202330e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time_median", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7598084595340949e+07, - "cpu_time": 4.9890672115382656e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8632986661204147e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3458936114597273e+04, - "cpu_time": 7.7575637936477040e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1232227334223609e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3024008558561507e-03, - "cpu_time": 1.5556199443200731e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3065666351475013e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 4.5961602528889976e+07, - "cpu_time": 9.4062428800001875e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.8404285584096022e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 4.5911916593710579e+07, - "cpu_time": 9.3949280466665640e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.8467490777061710e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 4.5977101226647697e+07, - "cpu_time": 9.4076618733333811e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.8384597731972389e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.5911958316961922e+07, - "cpu_time": 9.4025856133331820e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.8467437643762627e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 4.5990934967994690e+07, - "cpu_time": 9.4034116999997273e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.8367036066304264e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5950702726840973e+07, - "cpu_time": 9.4029660226666078e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.8418169560639410e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time_median", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5961602528889969e+07, - "cpu_time": 9.4034116999997258e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.8404285584096022e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6877544389991221e+04, - "cpu_time": 4.9432075910834610e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6889212850377429e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.0254581979330875e-04, - "cpu_time": 5.2570726929858727e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0264775844620295e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 9.9065597686502665e+07, - "cpu_time": 1.7557119044444865e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4193476296277037e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 9.9016334447595805e+07, - "cpu_time": 1.7433187711111486e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4220438980614643e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 9.8973720437950552e+07, - "cpu_time": 1.7495808200000182e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4243784069588413e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 9.8947587112585708e+07, - "cpu_time": 1.7493660744443989e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4258110547873316e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 9.8818984296586782e+07, - "cpu_time": 1.7428602655555400e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4328721937546120e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8964444796244308e+07, - "cpu_time": 1.7481675671111184e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4248906366379910e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time_median", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8973720437950566e+07, - "cpu_time": 1.7493660744443992e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4243784069588413e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2808161157102702e+04, - "cpu_time": 5.2921876811289147e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0902762701920215e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.3779297552957878e-04, - "cpu_time": 3.0272771218804611e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3831868900985942e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.9238923862576485e+08, - "cpu_time": 3.1406285850002289e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5810908742595549e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.9199131801724434e+08, - "cpu_time": 3.1226287100000149e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5926582258451824e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.9233843684196472e+08, - "cpu_time": 3.1326795974999303e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5825649913243408e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.9228979945182800e+08, - "cpu_time": 3.1257211150000328e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5839770339403334e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.9205844029784203e+08, - "cpu_time": 3.1155585950000387e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5907036542359371e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9221344664692879e+08, - "cpu_time": 3.1274433205000496e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5861989559210701e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time_median", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9228979945182800e+08, - "cpu_time": 3.1257211150000328e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5839770339403334e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7728734857977860e+05, - "cpu_time": 9.6002989928890741e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1538725506321946e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.2234623369213346e-04, - "cpu_time": 3.0696955976660433e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2260812607996483e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8639886515899058e+06, - "cpu_time": 2.0652947857145052e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1974382711537867e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8664766885098452e+06, - "cpu_time": 2.0679924391533714e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1945090582782249e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8638659039521208e+06, - "cpu_time": 2.0649462486772868e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1975829866917394e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8625787057442327e+06, - "cpu_time": 2.0677845343912949e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1991017009739499e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8646553246418035e+06, - "cpu_time": 2.0659817592592880e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1966526177092986e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8643130548875816e+06, - "cpu_time": 2.0663999534391493e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1970569269613996e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time_median", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8639886515899054e+06, - "cpu_time": 2.0659817592592877e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1974382711537867e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4240441921017978e+03, - "cpu_time": 1.4109052741708197e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6776742680589196e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.6384392008007913e-04, - "cpu_time": 6.8278421697727152e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.6360072762392966e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 380, - "real_time": 1.8637917160192861e+06, - "cpu_time": 2.0663444157892889e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3953409222660325e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 380, - "real_time": 1.8673588665957430e+06, - "cpu_time": 2.0699726157895264e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3869446556538371e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 380, - "real_time": 1.8637276698044795e+06, - "cpu_time": 2.0662974868421792e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3954919663018193e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 380, - "real_time": 1.8663908518838549e+06, - "cpu_time": 2.0687060052631225e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3892199705819106e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 380, - "real_time": 1.8638868414104525e+06, - "cpu_time": 2.0664696500001643e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3951166014997438e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8650311891427631e+06, - "cpu_time": 2.0675580347368564e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3924228232606687e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time_median", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8638868414104525e+06, - "cpu_time": 2.0664696500001638e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3951166014997438e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7184115571057398e+03, - "cpu_time": 1.6877848845477645e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0453667206196369e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.2138489002727348e-04, - "cpu_time": 8.1631802164265415e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2098754682651469e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8685889693362231e+06, - "cpu_time": 2.0731623085106565e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7681134100989960e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8630114517052672e+06, - "cpu_time": 2.0711413882980153e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7943635477942228e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8647127153405775e+06, - "cpu_time": 2.0690714414895605e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7863400432744771e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8674540294941447e+06, - "cpu_time": 2.0720021276595599e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7734422059310842e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8648582793870680e+06, - "cpu_time": 2.0692311808509300e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7856542135657668e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8657250890526562e+06, - "cpu_time": 2.0709216893617448e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7815826841329094e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time_median", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8648582793870675e+06, - "cpu_time": 2.0711413882980153e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7856542135657668e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2545028559901111e+03, - "cpu_time": 1.7689845195933565e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0609536067444526e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2083789134951608e-03, - "cpu_time": 8.5420155126124310e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2081576236382164e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8717140183674139e+06, - "cpu_time": 2.0780755013263612e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7506948005113304e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8720959810140501e+06, - "cpu_time": 2.0784891458883169e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7503376072764549e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8686485232728834e+06, - "cpu_time": 2.0749204827585774e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7535667939633615e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8662506171294663e+06, - "cpu_time": 2.0760886445623811e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7558199150337804e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8697693642594453e+06, - "cpu_time": 2.0756915305038870e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7525156110886615e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8696957008086522e+06, - "cpu_time": 2.0766530610079046e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7525869455747180e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time_median", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8697693642594453e+06, - "cpu_time": 2.0760886445623811e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7525156110886615e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3877583358566435e+03, - "cpu_time": 1.5523754675648288e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2392531520366898e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2770839312642838e-03, - "cpu_time": 7.4753722550621054e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2776844867473218e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8744713320941553e+06, - "cpu_time": 2.0870646525197262e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4962391196873263e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8724966032882296e+06, - "cpu_time": 2.0848250106098626e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4999262420510881e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8762211725914008e+06, - "cpu_time": 2.0885628726789861e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4929783842852026e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8782413347733244e+06, - "cpu_time": 2.0909736312997383e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4892214747211494e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8752102160309714e+06, - "cpu_time": 2.0874977427056436e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4948615061788678e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8753281317556165e+06, - "cpu_time": 2.0877847819627915e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4946453453847267e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time_median", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8752102160309714e+06, - "cpu_time": 2.0874977427056439e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4948615061788678e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1242549868000492e+03, - "cpu_time": 2.2436248386008642e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9582775266680073e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1327377597708172e-03, - "cpu_time": 1.0746437362626825e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1326693084594652e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8741738105668349e+06, - "cpu_time": 2.1035854069149285e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9935882819938615e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8774260984850735e+06, - "cpu_time": 2.1036379547872893e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9814732044986576e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8744180574201969e+06, - "cpu_time": 2.1035378989361012e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9926769794566154e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8767654669608553e+06, - "cpu_time": 2.1023755851061614e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9839307205631688e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8788067509957089e+06, - "cpu_time": 2.1048947819148805e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9763428266656980e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8763180368857342e+06, - "cpu_time": 2.1036063255318720e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9856024026356012e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time_median", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8767654669608555e+06, - "cpu_time": 2.1035854069149285e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9839307205631688e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9893039345038155e+03, - "cpu_time": 8.9176258630354312e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4062212303238688e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0602168158046451e-03, - "cpu_time": 4.2392085224314551e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0602122484854809e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 374, - "real_time": 1.8849163934841184e+06, - "cpu_time": 2.1306292727272948e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3907460347111079e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 374, - "real_time": 1.8847020789853267e+06, - "cpu_time": 2.1301222032086095e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3909041801510152e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 374, - "real_time": 1.8878926385759332e+06, - "cpu_time": 2.1334311336896792e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3885535365916747e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 374, - "real_time": 1.8858160739696093e+06, - "cpu_time": 2.1312160989305452e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3900825410199818e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 374, - "real_time": 1.8896236125878457e+06, - "cpu_time": 2.1346341417113687e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3872815636601457e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8865901595205669e+06, - "cpu_time": 2.1320065700534997e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3895135712267852e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time_median", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8858160739696093e+06, - "cpu_time": 2.1312160989305452e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3900825410199818e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1132817190626965e+03, - "cpu_time": 1.9368883095076144e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5556357480142967e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1201594095029831e-03, - "cpu_time": 9.0848139809391454e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1195541952431917e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 370, - "real_time": 1.9110426122662486e+06, - "cpu_time": 2.1948642837837478e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7434657743097758e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 370, - "real_time": 1.9093984511454364e+06, - "cpu_time": 2.1946339594595321e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7458281412425095e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 370, - "real_time": 1.9078443045539127e+06, - "cpu_time": 2.1926585243243831e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7480649167678684e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 370, - "real_time": 1.9078737242002594e+06, - "cpu_time": 2.1930930405405150e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7480225412704951e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 370, - "real_time": 1.9066027824206881e+06, - "cpu_time": 2.1919046783781401e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7498543736223125e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9085523749173090e+06, - "cpu_time": 2.1934308972972636e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7470471494425923e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time_median", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9078737242002594e+06, - "cpu_time": 2.1930930405405154e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7480225412704951e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7087984355574804e+03, - "cpu_time": 1.2788673471747002e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4586569492306162e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.9533745995915698e-04, - "cpu_time": 5.8304428407136746e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9501811052988519e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 368, - "real_time": 1.9222639050934482e+06, - "cpu_time": 2.2832516929348093e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4549013651121163e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 368, - "real_time": 1.9147634084220042e+06, - "cpu_time": 2.2780098749999697e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4762692632827830e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 368, - "real_time": 1.9153294891546702e+06, - "cpu_time": 2.2765256494565732e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4746507373140717e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 368, - "real_time": 1.9157951501256321e+06, - "cpu_time": 2.2788846141303363e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4733200464112127e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 368, - "real_time": 1.9156942877958973e+06, - "cpu_time": 2.2766998070653328e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4736082196415555e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9167692481183310e+06, - "cpu_time": 2.2786743277174039e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4705499263523483e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time_median", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9156942877958971e+06, - "cpu_time": 2.2780098749999697e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4736082196415555e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0980623228453123e+03, - "cpu_time": 2.7364913755485304e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8237131825552892e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6162938370837504e-03, - "cpu_time": 1.2009137691430135e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6129481133240954e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 359, - "real_time": 1.9601109346198465e+06, - "cpu_time": 2.4685241030640788e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0699149537710896e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 359, - "real_time": 1.9619637005184169e+06, - "cpu_time": 2.4714361420611469e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0689045875037657e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 359, - "real_time": 1.9619449216568931e+06, - "cpu_time": 2.4699144038997153e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0689148185816157e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 359, - "real_time": 1.9594253878132508e+06, - "cpu_time": 2.4675389136491558e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0702892863608625e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 359, - "real_time": 1.9606510185361593e+06, - "cpu_time": 2.4688701337048477e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0696202333680747e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9608191926289133e+06, - "cpu_time": 2.4692567392757894e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0695287759170817e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time_median", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9606510185361591e+06, - "cpu_time": 2.4688701337048477e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0696202333680747e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1235844373091304e+03, - "cpu_time": 1.4848791049676195e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1286799557490356e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.7301787004783249e-04, - "cpu_time": 6.0134658391298806e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7302618627478414e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 346, - "real_time": 2.0320174924227158e+06, - "cpu_time": 2.8737728959540119e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0641082154264591e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 346, - "real_time": 2.0318283568906216e+06, - "cpu_time": 2.8757037427746155e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0643003557735019e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 346, - "real_time": 2.0314583728477531e+06, - "cpu_time": 2.8768404710981906e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0646763212382796e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 346, - "real_time": 2.0318870549426668e+06, - "cpu_time": 2.8766681820809282e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0642407213516843e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 346, - "real_time": 2.0327097033096661e+06, - "cpu_time": 2.8744909450866631e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0634053122149303e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0319801960826847e+06, - "cpu_time": 2.8754952473988822e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0641461852009709e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time_median", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0318870549426668e+06, - "cpu_time": 2.8757037427746155e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0642407213516843e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5760291471792641e+02, - "cpu_time": 1.3420125300773536e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6478068944395700e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2520047961102559e-04, - "cpu_time": 4.6670657212572776e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2516849473948702e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 327, - "real_time": 2.1417730470794602e+06, - "cpu_time": 3.7020312629969595e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9166652187722578e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 327, - "real_time": 2.1495386934625586e+06, - "cpu_time": 3.7097361498473673e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9025154678594375e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 327, - "real_time": 2.1446041509349593e+06, - "cpu_time": 3.7029459449541336e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9114948072551808e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 327, - "real_time": 2.1455915654021162e+06, - "cpu_time": 3.7045710152902422e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9096947132283525e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 327, - "real_time": 2.1377529732495639e+06, - "cpu_time": 3.7017068012234550e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9240305615146041e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1438520860257321e+06, - "cpu_time": 3.7041982348624319e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9128801537259660e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time_median", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1446041509349593e+06, - "cpu_time": 3.7029459449541336e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9114948072551808e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4002975428615928e+03, - "cpu_time": 3.2893276780297406e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0335428113479298e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0525191880279648e-03, - "cpu_time": 8.8799990429019285e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0531021896231963e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 177, - "real_time": 3.9675992671505543e+06, - "cpu_time": 7.0536578248587018e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.2285560789633479e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 177, - "real_time": 3.9659306370142824e+06, - "cpu_time": 7.0523577570624296e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.2303352064247360e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 177, - "real_time": 3.9842628931763484e+06, - "cpu_time": 7.0695491694915406e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.2108707306271167e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 177, - "real_time": 3.9656394645361239e+06, - "cpu_time": 7.0496105706212604e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.2306458138807368e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 177, - "real_time": 3.9674536953811762e+06, - "cpu_time": 7.0574188361582719e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.2287112309670238e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9701771914516971e+06, - "cpu_time": 7.0565188316384424e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.2258238121725922e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time_median", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9674536953811767e+06, - "cpu_time": 7.0536578248587009e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.2287112309670238e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9229777825477886e+03, - "cpu_time": 7.8074273029595224e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4113241438051835e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9956232179276479e-03, - "cpu_time": 1.1064134439710306e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9904578415162865e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 92, - "real_time": 7.7330696588868033e+06, - "cpu_time": 1.3808800032608282e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.3390831170697422e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 92, - "real_time": 7.8457016953388629e+06, - "cpu_time": 1.3913975760869868e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2767917138545694e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 92, - "real_time": 7.7325444587546848e+06, - "cpu_time": 1.3845255500000250e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.3393778308005867e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 92, - "real_time": 7.7584001954401964e+06, - "cpu_time": 1.3856530902173696e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.3249163686762085e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 92, - "real_time": 7.6930886134505272e+06, - "cpu_time": 1.3769375510868849e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.3616333680771246e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7525609243742153e+06, - "cpu_time": 1.3838787541304190e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.3283604796956472e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time_median", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7330696588868024e+06, - "cpu_time": 1.3845255500000250e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.3390831170697422e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.7067557323099114e+04, - "cpu_time": 5.4146122560091244e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1680599702040996e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.3611233603695413e-03, - "cpu_time": 3.9126348604227815e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3193071257938863e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 47, - "real_time": 1.5111502933692425e+07, - "cpu_time": 2.6988733276597332e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4409126143485622e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 47, - "real_time": 1.5111026354134083e+07, - "cpu_time": 2.6984515382979866e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4410526742043781e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 47, - "real_time": 1.5106583846376298e+07, - "cpu_time": 2.6987549170211848e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4423586882680817e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 47, - "real_time": 1.5117157587504134e+07, - "cpu_time": 2.7048439361702219e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4392514671853590e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 47, - "real_time": 1.5135530422025539e+07, - "cpu_time": 2.7081101276595060e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4338627143414669e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5116360228746494e+07, - "cpu_time": 2.7018067693617266e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4394876316695700e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time_median", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5111502933692425e+07, - "cpu_time": 2.6988733276597332e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4409126143485622e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1355101024056668e+04, - "cpu_time": 4.4196483589654214e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3323553370191483e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.5117957313976204e-04, - "cpu_time": 1.6358121569180601e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5061710122749923e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 27, - "real_time": 2.6227649922172230e+07, - "cpu_time": 5.0114047481483966e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1174134319421253e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 27, - "real_time": 2.6252597846366741e+07, - "cpu_time": 5.0199289259260833e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1125503382734833e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 27, - "real_time": 2.6204787746623710e+07, - "cpu_time": 5.0047507074071757e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1218780818895559e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 27, - "real_time": 2.6195371316538915e+07, - "cpu_time": 5.0038670481479101e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1237192394848490e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 27, - "real_time": 2.6193670652530812e+07, - "cpu_time": 5.0060795333331920e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1240519047692919e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6214815496846482e+07, - "cpu_time": 5.0092061925925508e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1199225992718611e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time_median", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6204787746623710e+07, - "cpu_time": 5.0060795333331920e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1218780818895559e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5089663067190530e+04, - "cpu_time": 6.6697913466625032e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8973387158006541e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.5707952131910648e-04, - "cpu_time": 1.3315066480045423e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5652592804765018e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.4834676906466484e+07, - "cpu_time": 9.4406130099991962e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8953594904530973e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.4790101200342178e+07, - "cpu_time": 9.4507421200000852e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8993422191073370e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.4820037260651588e+07, - "cpu_time": 9.4570215999999613e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8966667921744747e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.4824643582105637e+07, - "cpu_time": 9.4585917400002018e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8962553782586813e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.4862899705767632e+07, - "cpu_time": 9.4354506199999839e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8928411994195032e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4826471731066704e+07, - "cpu_time": 9.4484838179998860e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8960930158826189e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time_median", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4824643582105637e+07, - "cpu_time": 9.4507421200000852e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8962553782586813e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6276806725520517e+04, - "cpu_time": 1.0148615733838618e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3465545081075784e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.7927225473148779e-04, - "cpu_time": 1.0740999222017971e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7927081869063813e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.1086676269769669e+08, - "cpu_time": 1.8505674387500903e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.8424874952279434e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 1.1094672884792089e+08, - "cpu_time": 1.8512826562499639e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.8389972158251762e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.1101074330508709e+08, - "cpu_time": 1.8540257287499174e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.8362068031968374e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 1.1111070495098829e+08, - "cpu_time": 1.8563250799999765e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.8318558705645647e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.1100906413048506e+08, - "cpu_time": 1.8502380837500709e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.8362799579044981e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1098880078643560e+08, - "cpu_time": 1.8524877975000042e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.8371654685438042e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time_median", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1100906413048506e+08, - "cpu_time": 1.8512826562499639e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.8362799579044981e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0022282909635222e+04, - "cpu_time": 2.6120549683511429e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9234635585207110e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.1109339205183320e-04, - "cpu_time": 1.4100254651481113e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1110798959330274e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 2.1601998060941696e+08, - "cpu_time": 3.3632168775000083e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 4.9705671714757681e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 2.1577393636107445e+08, - "cpu_time": 3.3416782349999607e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 4.9762350453819809e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 2.1595014259219170e+08, - "cpu_time": 3.3811726425000191e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 4.9721746469401236e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 2.1559766307473183e+08, - "cpu_time": 3.3454117850001806e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 4.9803036298580513e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 2.1577141061425209e+08, - "cpu_time": 3.3467933274999952e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 4.9762932954987011e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1582262665033340e+08, - "cpu_time": 3.3556545735000336e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 4.9751147578309250e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time_median", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1577393636107445e+08, - "cpu_time": 3.3467933274999952e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 4.9762350453819809e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6644168463491328e+05, - "cpu_time": 1.6485863050275822e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8370946655822815e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.7119664058474728e-04, - "cpu_time": 4.9128605728570706e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7125751914418090e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8651022260452958e+06, - "cpu_time": 2.0669402189973653e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1961262727593379e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8696540108758104e+06, - "cpu_time": 2.0714253693931894e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1907796716256035e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8654636094407460e+06, - "cpu_time": 2.0669510052769661e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1957008323673247e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8700166547205301e+06, - "cpu_time": 2.0713169313984744e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1903548236644655e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8660478902618843e+06, - "cpu_time": 2.0670045118734532e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1950133334601396e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8672568782688535e+06, - "cpu_time": 2.0687276073878896e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1935949867753745e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time_median", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8660478902618843e+06, - "cpu_time": 2.0670045118734532e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1950133334601396e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3813127729268099e+03, - "cpu_time": 2.4136408773696648e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7963528960134786e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2753000407391944e-03, - "cpu_time": 1.1667272524183527e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2747808564807898e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 375, - "real_time": 1.8648549035812416e+06, - "cpu_time": 2.0679735119999046e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3928350587856434e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 375, - "real_time": 1.8606232092715800e+06, - "cpu_time": 2.0687425786666912e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4028258699444616e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 375, - "real_time": 1.8655226393602788e+06, - "cpu_time": 2.0678672079999766e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3912627095263684e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 375, - "real_time": 1.8696528168705604e+06, - "cpu_time": 2.0726634346665379e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3815621414203709e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 375, - "real_time": 1.8648084123657707e+06, - "cpu_time": 2.0677338879998690e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3929445757954838e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8650923962898864e+06, - "cpu_time": 2.0689961242665965e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3922860710944654e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time_median", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8648549035812418e+06, - "cpu_time": 2.0679735119999046e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3928350587856434e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2051999637651502e+03, - "cpu_time": 2.0872756832840646e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5477200578246848e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7185207393162168e-03, - "cpu_time": 1.0088349894922825e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7184035683595516e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8711508736097519e+06, - "cpu_time": 2.0750059179894375e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7561084630191363e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8714133419043189e+06, - "cpu_time": 2.0755244285714258e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7548804067667462e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8660287680667974e+06, - "cpu_time": 2.0705873624338801e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7801433077442832e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8615732848172742e+06, - "cpu_time": 2.0710302275131859e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8011576732571106e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8665286814635335e+06, - "cpu_time": 2.0704858756615492e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7777917171641886e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8673389899723355e+06, - "cpu_time": 2.0725267624338958e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7740163135902938e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time_median", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8665286814635335e+06, - "cpu_time": 2.0710302275131859e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7777917171641886e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0849552563674129e+03, - "cpu_time": 2.5148718896573614e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9204954934168356e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1875809792992820e-03, - "cpu_time": 1.2134327697192158e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1888442245566971e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8746223941558679e+06, - "cpu_time": 2.0818033448276476e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7479786917170193e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8692842521372780e+06, - "cpu_time": 2.0766075729444970e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7529704196958888e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8746113732995389e+06, - "cpu_time": 2.0812850530502081e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7479889680987280e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8744564772906543e+06, - "cpu_time": 2.0810801061007148e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7481334134448923e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8694892260534700e+06, - "cpu_time": 2.0764142413795153e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7527782210959256e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8724927445873623e+06, - "cpu_time": 2.0794380636605166e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7499699428104907e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time_median", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8744564772906541e+06, - "cpu_time": 2.0810801061007145e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7481334134448923e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8370666372754395e+03, - "cpu_time": 2.6859545354842626e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6528979581888369e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5151282404037506e-03, - "cpu_time": 1.2916732565508931e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5159677279532149e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8652612754705471e+06, - "cpu_time": 2.0839256843501593e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5135024171596184e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8704377289395777e+06, - "cpu_time": 2.0838542811671549e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5037787671848796e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8759414295644921e+06, - "cpu_time": 2.0900922413792510e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4934992621392481e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8696097635237291e+06, - "cpu_time": 2.0836235517240444e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5053304319764383e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8762865145700003e+06, - "cpu_time": 2.0899620265253065e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4928567407531187e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8715073424136695e+06, - "cpu_time": 2.0862915570291833e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5017935238426603e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time_median", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8704377289395779e+06, - "cpu_time": 2.0839256843501590e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5037787671848796e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6438089496794209e+03, - "cpu_time": 3.4122378039111354e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6920935652393324e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4813201874433117e-03, - "cpu_time": 1.6355517484670549e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4821833457790922e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8671045489757857e+06, - "cpu_time": 2.0979116781916218e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0200675196201801e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8674611559269601e+06, - "cpu_time": 2.0980959601063617e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0187269804248869e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8714126523031774e+06, - "cpu_time": 2.0976851329787727e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0039069062981695e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8679820252068471e+06, - "cpu_time": 2.0979832207447235e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0167698741900921e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8685143988593754e+06, - "cpu_time": 2.0984809627659395e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0147706691482916e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8684949562544290e+06, - "cpu_time": 2.0980313909574840e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0148483899363235e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time_median", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8679820252068471e+06, - "cpu_time": 2.0979832207447235e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0167698741900921e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7159838303355587e+03, - "cpu_time": 2.9275846981742723e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4361670532623684e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.1837755547138705e-04, - "cpu_time": 1.3953960416379676e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1750622329854687e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8795345825678173e+06, - "cpu_time": 2.1262997872340409e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3947282610882279e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8800073067587677e+06, - "cpu_time": 2.1262349335104390e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3943775593720973e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8794826666364432e+06, - "cpu_time": 2.1259200585107952e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3947667869113034e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8794409095673782e+06, - "cpu_time": 2.1262278962767404e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3947977755807284e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8793460398267191e+06, - "cpu_time": 2.1259659175530518e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3948681852341062e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8795623010714252e+06, - "cpu_time": 2.1261297186170137e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3947077136372930e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time_median", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8794826666364432e+06, - "cpu_time": 2.1262278962767404e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3947667869113034e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5818832285281144e+02, - "cpu_time": 1.7350828981279466e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9155676182270363e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3736619568589656e-04, - "cpu_time": 8.1607574690060222e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3734545234796039e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 371, - "real_time": 1.9012148767544054e+06, - "cpu_time": 2.1847029892182150e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7576472623390186e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 371, - "real_time": 1.8991115841119627e+06, - "cpu_time": 2.1846381239892822e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7607013952535105e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 371, - "real_time": 1.8963535885656669e+06, - "cpu_time": 2.1813069973044344e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7647164703949142e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 371, - "real_time": 1.8964036459773476e+06, - "cpu_time": 2.1810521239890684e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7646434930249155e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 371, - "real_time": 1.8957886596824068e+06, - "cpu_time": 2.1806563126682951e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7655403323692822e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8977744710183584e+06, - "cpu_time": 2.1824713094338593e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7626497906763285e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time_median", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8964036459773481e+06, - "cpu_time": 2.1813069973044344e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7646434930249155e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3165587598575698e+03, - "cpu_time": 2.0211013887203985e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3698212071265740e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2206712626998766e-03, - "cpu_time": 9.2606092001487953e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2197786409625243e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 373, - "real_time": 1.8895772387505819e+06, - "cpu_time": 2.2630672064344287e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5492624408057272e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 373, - "real_time": 1.8970865201349834e+06, - "cpu_time": 2.2666657587132524e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5272966671303463e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 373, - "real_time": 1.8899439918794907e+06, - "cpu_time": 2.2628797774800891e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5481855785431170e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 373, - "real_time": 1.8950356948457847e+06, - "cpu_time": 2.2655061823054873e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5332783590935552e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 373, - "real_time": 1.8903365102471740e+06, - "cpu_time": 2.2634388954422888e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5470335271834314e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8923959911716029e+06, - "cpu_time": 2.2643115640751095e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5410113145512354e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time_median", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8903365102471740e+06, - "cpu_time": 2.2634388954422893e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5470335271834314e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4339563503345839e+03, - "cpu_time": 1.6829538355140235e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0046247399701044e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8146077070310131e-03, - "cpu_time": 7.4325188380224081e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8130710856551799e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 363, - "real_time": 1.9385193712873380e+06, - "cpu_time": 2.4587495426997147e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0818318511861539e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 363, - "real_time": 1.9387349209904710e+06, - "cpu_time": 2.4596245179062192e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0817115724766519e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 363, - "real_time": 1.9390527826038601e+06, - "cpu_time": 2.4596257079891190e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0815342515760896e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 363, - "real_time": 1.9381112259037832e+06, - "cpu_time": 2.4595376060607266e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0820596733410139e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 363, - "real_time": 1.9360554690624154e+06, - "cpu_time": 2.4581431460055732e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0832086340044792e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9380947539695739e+06, - "cpu_time": 2.4591361041322704e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0820691965168779e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time_median", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9385193712873380e+06, - "cpu_time": 2.4595376060607270e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0818318511861539e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1902611897534348e+03, - "cpu_time": 6.6611923428011551e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6498164040821453e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.1413983362555496e-04, - "cpu_time": 2.7087530176177948e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1454631787759447e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 356, - "real_time": 1.9695095981476475e+06, - "cpu_time": 2.8057177078651651e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1296184613392107e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 356, - "real_time": 1.9673136386005313e+06, - "cpu_time": 2.8060245196631253e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1319955891647563e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 356, - "real_time": 1.9673387741727568e+06, - "cpu_time": 2.8042513876406127e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1319683498657503e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 356, - "real_time": 1.9713589775093487e+06, - "cpu_time": 2.8055323314606412e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1276206149420645e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 356, - "real_time": 1.9696241625966611e+06, - "cpu_time": 2.8055670028089006e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1294945907194927e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9690290302053890e+06, - "cpu_time": 2.8054185898876889e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1301395212062550e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time_median", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9695095981476470e+06, - "cpu_time": 2.8055670028089006e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1296184613392107e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7185252661459799e+03, - "cpu_time": 6.8079862672729882e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8588928166196134e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7277802398206443e-04, - "cpu_time": 2.4267274380417988e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7266247028127059e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 352, - "real_time": 1.9947554296364121e+06, - "cpu_time": 3.5499602755683796e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.2053315786833119e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 352, - "real_time": 1.9932594490951903e+06, - "cpu_time": 3.5463814886362855e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.2084877629993834e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 352, - "real_time": 1.9955840361944863e+06, - "cpu_time": 3.5525892159087909e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.2035854405794911e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 352, - "real_time": 1.9884335197275504e+06, - "cpu_time": 3.5476306221592068e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.2187017653722630e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 352, - "real_time": 1.9994326916771985e+06, - "cpu_time": 3.5502105227274555e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1954940693519044e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9942930252661675e+06, - "cpu_time": 3.5493544250000240e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.2063201233972712e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time_median", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9947554296364118e+06, - "cpu_time": 3.5499602755683800e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.2053315786833119e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9905758572850382e+03, - "cpu_time": 2.4173165543627188e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4211471364511847e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0009977504446409e-03, - "cpu_time": 6.8105809251852963e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0020224066183939e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 194, - "real_time": 3.6265582311898470e+06, - "cpu_time": 6.6761092628863929e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6262089095135031e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 194, - "real_time": 3.6076105166149815e+06, - "cpu_time": 6.6595920773195140e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6505064564846792e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 194, - "real_time": 3.6097919657231146e+06, - "cpu_time": 6.6643851443297258e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6476960886689720e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 194, - "real_time": 3.6105515876996149e+06, - "cpu_time": 6.6679361907213163e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6467182624273872e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 194, - "real_time": 3.6093301185377939e+06, - "cpu_time": 6.6568106237112479e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6482908043880339e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6127684839530699e+06, - "cpu_time": 6.6649666597936405e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6438841042965155e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time_median", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6097919657231146e+06, - "cpu_time": 6.6643851443297267e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6476960886689720e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7839322070223525e+03, - "cpu_time": 7.5617613551065424e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9781103169046994e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1545615894282880e-03, - "cpu_time": 1.1345535155821273e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1486561879683788e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 99, - "real_time": 7.2382099249146199e+06, - "cpu_time": 1.3781538121212739e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6357362314820948e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 99, - "real_time": 7.2820323632296287e+06, - "cpu_time": 1.3688128595960064e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6078389007761002e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 99, - "real_time": 7.2504750434121098e+06, - "cpu_time": 1.3610259646464678e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6278942826633215e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 99, - "real_time": 7.2533518282903563e+06, - "cpu_time": 1.3660465363635913e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6260587924505672e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 99, - "real_time": 7.2462423375309119e+06, - "cpu_time": 1.3733596636363858e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6305975479469481e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2540622994755264e+06, - "cpu_time": 1.3694797672727451e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6256251510638075e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time_median", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2504750434121089e+06, - "cpu_time": 1.3688128595960062e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6278942826633215e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6644422683135090e+04, - "cpu_time": 6.5952875030991097e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0590637142049575e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2944967931056363e-03, - "cpu_time": 4.8159072231007223e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2895580156584729e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49, - "real_time": 1.4361083982702421e+07, - "cpu_time": 2.6715328857142836e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6729664752905149e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49, - "real_time": 1.4313158864269450e+07, - "cpu_time": 2.6653814653061591e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6886130892829475e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49, - "real_time": 1.4375549474997180e+07, - "cpu_time": 2.6716058795918055e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6682642716871290e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49, - "real_time": 1.4347493800581718e+07, - "cpu_time": 2.6715928571427271e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6773927859985609e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49, - "real_time": 1.4337142758375527e+07, - "cpu_time": 2.6696142020406503e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6807697412928448e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4346885776185263e+07, - "cpu_time": 2.6699454579591252e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6776012727104006e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time_median", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4347493800581718e+07, - "cpu_time": 2.6715328857142832e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6773927859985609e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3748670356326933e+04, - "cpu_time": 2.6893591416728799e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7460263890900863e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6553188424869125e-03, - "cpu_time": 1.0072711911233549e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6559826153377348e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 26, - "real_time": 2.7541461114126902e+07, - "cpu_time": 4.9950500192306451e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8732972968945141e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 26, - "real_time": 2.7556796629841510e+07, - "cpu_time": 4.9957835884618774e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8705852789382048e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 26, - "real_time": 2.7541135294506185e+07, - "cpu_time": 4.9992874269229598e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8733549494153681e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 26, - "real_time": 2.7561646098127730e+07, - "cpu_time": 4.9988129230769120e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8697283000494461e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 26, - "real_time": 2.7547787373455670e+07, - "cpu_time": 4.9956965384616032e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8721781600989380e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7549765302011602e+07, - "cpu_time": 4.9969260992308006e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8718287970792942e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time_median", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7547787373455673e+07, - "cpu_time": 4.9957835884618782e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8721781600989380e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1915947150385273e+03, - "cpu_time": 1.9667739674838256e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6252778468188138e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.3363604423763938e-04, - "cpu_time": 3.9359676897894895e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3360734018263996e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.3412785008549690e+07, - "cpu_time": 9.3482218299993739e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0256779525170240e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.3487505018711090e+07, - "cpu_time": 9.3461545500008464e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0186572715645542e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.3372624516487122e+07, - "cpu_time": 9.3388184000002638e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0294595484447031e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.3348928317427635e+07, - "cpu_time": 9.3317192599999994e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0316935028722868e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.3415488079190254e+07, - "cpu_time": 9.3334223600004405e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0254236299785452e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3407466188073158e+07, - "cpu_time": 9.3396672800001860e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0261823810754232e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time_median", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3412785008549690e+07, - "cpu_time": 9.3388184000002638e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0256779525170240e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2771866018403824e+04, - "cpu_time": 7.3850464226993747e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9641140692776190e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.8809903904762894e-04, - "cpu_time": 7.9071836300995374e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.8765100287018953e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 1.0523140927155812e+08, - "cpu_time": 1.8242087822222352e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1018124314439373e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 1.0526143511136372e+08, - "cpu_time": 1.8228022211111590e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1003571386995173e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 1.0527157038450241e+08, - "cpu_time": 1.8203676633332735e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0998660895727987e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 1.0538518594370948e+08, - "cpu_time": 1.8248016511111271e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0943679340924120e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 1.0541649411122005e+08, - "cpu_time": 1.8261701744444913e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0928549324887667e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0531321896447077e+08, - "cpu_time": 1.8236700984444574e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0978517052594862e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time_median", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0527157038450241e+08, - "cpu_time": 1.8242087822222352e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0998660895727987e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2088366298419700e+04, - "cpu_time": 2.2068223979406329e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9726154009468374e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.7946877994597831e-04, - "cpu_time": 1.2100995678017612e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7927245252117962e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.7309843003749847e+08, - "cpu_time": 3.1631299374998891e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.2030708410665207e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.7302027344703674e+08, - "cpu_time": 3.1587986849999082e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.2058728876571980e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.7280907183885574e+08, - "cpu_time": 3.1511488775001341e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.2134575029791431e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.7322742566466331e+08, - "cpu_time": 3.1572473699998230e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1984516590263729e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.7332270741462708e+08, - "cpu_time": 3.1802114125000000e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1950441463585434e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7309558168053630e+08, - "cpu_time": 3.1621072564999509e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.2031794074175558e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time_median", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7309843003749847e+08, - "cpu_time": 3.1587986849999082e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.2030708410665207e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9794965758325611e+05, - "cpu_time": 1.0993834105757196e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0964770870059179e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1435858481274831e-03, - "cpu_time": 3.4767429482850517e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1440064233061173e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8665508063499560e+06, - "cpu_time": 2.0695740848805385e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1944219177241344e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8718214993150807e+06, - "cpu_time": 2.0746848435015006e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1882428434008104e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8669043349981275e+06, - "cpu_time": 2.0694213342173693e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1940063683038736e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8626848939467785e+06, - "cpu_time": 2.0701459257293148e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1989763342747292e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8770251101897585e+06, - "cpu_time": 2.0791693076923778e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1821764545205864e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8689973289599405e+06, - "cpu_time": 2.0725990992042203e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1915647836448266e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time_median", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8669043349981278e+06, - "cpu_time": 2.0701459257293150e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1940063683038736e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5370150367055267e+03, - "cpu_time": 4.2657042477899104e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4852070952372242e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9625590956765917e-03, - "cpu_time": 2.0581424788941277e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9591674148238376e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8736120451533694e+06, - "cpu_time": 2.0768588121692725e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3723032317127436e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8735587160027875e+06, - "cpu_time": 2.0771617354498440e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3724276853610026e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8669791954774938e+06, - "cpu_time": 2.0703525820104319e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3878367899567485e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8722558559689093e+06, - "cpu_time": 2.0757880185186800e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3754703577949638e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8668717141269348e+06, - "cpu_time": 2.0704886825396465e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3880894107558373e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8706555053458989e+06, - "cpu_time": 2.0741299661375750e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3792254951162590e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time_median", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8722558559689093e+06, - "cpu_time": 2.0757880185186800e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3754703577949638e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4483043696020782e+03, - "cpu_time": 3.4247240988604490e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0770106430370870e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8433668624434725e-03, - "cpu_time": 1.6511617665106769e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8443924963545775e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8636640545862194e+06, - "cpu_time": 2.0734630211640247e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7912840083389711e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8635213974453374e+06, - "cpu_time": 2.0738160396825501e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7919570027263891e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8677571795744668e+06, - "cpu_time": 2.0730797883599070e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7720182147728559e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8743108790735872e+06, - "cpu_time": 2.0797676005293725e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7413460503937807e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8702630252283553e+06, - "cpu_time": 2.0751193571426382e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7602651493361723e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8679033071815935e+06, - "cpu_time": 2.0750491613756984e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7713740851136353e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time_median", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8677571795744668e+06, - "cpu_time": 2.0738160396825499e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7720182147728559e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5776357322931817e+03, - "cpu_time": 2.7469735824505719e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1480035885004796e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4506813145484486e-03, - "cpu_time": 1.3238113262961954e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4488792379132140e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8775307615485755e+06, - "cpu_time": 2.0849050372341233e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7452710054653466e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8708860888124190e+06, - "cpu_time": 2.0786579680850899e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7514695414085910e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8674367102574522e+06, - "cpu_time": 2.0800652898936064e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7547047147575069e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8685200956245721e+06, - "cpu_time": 2.0812309893617181e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7536873206090383e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8710494742527830e+06, - "cpu_time": 2.0779417313830669e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7513165980330978e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8710846260991606e+06, - "cpu_time": 2.0805602031915213e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7512898360547163e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time_median", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8708860888124190e+06, - "cpu_time": 2.0800652898936062e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7514695414085910e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9203769423985700e+03, - "cpu_time": 2.7407740294323494e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6629448747515642e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0952429877914057e-03, - "cpu_time": 1.3173250287245131e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0915697672313342e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8770654348978298e+06, - "cpu_time": 2.0903324827585267e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4914073202550434e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8718015555099682e+06, - "cpu_time": 2.0849420477453163e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5012258541555099e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8786204650652884e+06, - "cpu_time": 2.0916641034484529e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4885173039846770e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8759182900893169e+06, - "cpu_time": 2.0894089973474026e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4935423544956043e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8672502311281627e+06, - "cpu_time": 2.0862929920424684e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5097599083120316e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8741311953381132e+06, - "cpu_time": 2.0885281246684338e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4968905482405730e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time_median", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8759182900893167e+06, - "cpu_time": 2.0894089973474026e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4935423544956043e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6024966679139743e+03, - "cpu_time": 2.8161042797084565e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5994580628665193e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4558028164531113e-03, - "cpu_time": 1.3483678991182029e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4591727834299116e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8678145662558195e+06, - "cpu_time": 2.0979667526596151e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0173989628287390e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8782775920779852e+06, - "cpu_time": 2.1032496196807688e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9783082411685377e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8728967328996153e+06, - "cpu_time": 2.0982842632978032e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9983570208419636e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8689358625356653e+06, - "cpu_time": 2.0983276170214023e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0131887684026256e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8781541888568022e+06, - "cpu_time": 2.1035033670211467e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9787667475683197e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8732157885251779e+06, - "cpu_time": 2.1002663239361471e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9972039481620371e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time_median", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8728967328996155e+06, - "cpu_time": 2.0983276170214023e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9983570208419636e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9396968027350131e+03, - "cpu_time": 2.8440146961677774e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8450344039136506e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6370142900750053e-03, - "cpu_time": 1.3541209815894956e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6368166736061593e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8735877588079211e+06, - "cpu_time": 2.1211186037233691e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3991551704350924e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8734851832476200e+06, - "cpu_time": 2.1210729840424000e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3992317758584175e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8738000679227395e+06, - "cpu_time": 2.1212696063827858e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3989966405039576e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8741460839822702e+06, - "cpu_time": 2.1211571569147226e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3987383493766111e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8868818952274097e+06, - "cpu_time": 2.1342680904254811e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3892973410951406e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8763801978375923e+06, - "cpu_time": 2.1237772882977515e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3970838554538438e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time_median", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8738000679227393e+06, - "cpu_time": 2.1211571569147226e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3989966405039576e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.8760702934378342e+03, - "cpu_time": 5.8649883099735343e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3568856555457134e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1315989692332225e-03, - "cpu_time": 2.7615834966737188e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1185570132655892e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 372, - "real_time": 1.8997033882725944e+06, - "cpu_time": 2.1814506129034744e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7598413691136098e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 372, - "real_time": 1.8988397120753482e+06, - "cpu_time": 2.1820103736558240e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7610966669060040e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 372, - "real_time": 1.8947867844666864e+06, - "cpu_time": 2.1783396962364940e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7670026216040343e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 372, - "real_time": 1.8944027183498559e+06, - "cpu_time": 2.1780581451614895e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7675635962805623e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 372, - "real_time": 1.8962994808555201e+06, - "cpu_time": 2.1794922634408753e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7647953569204491e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8968064168040012e+06, - "cpu_time": 2.1798702182796309e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7640599221649325e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time_median", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8962994808555201e+06, - "cpu_time": 2.1794922634408753e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7647953569204491e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3790963853702146e+03, - "cpu_time": 1.7921264444108936e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4660189027182182e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2542642012877841e-03, - "cpu_time": 8.2212529414950764e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2539593931825764e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 371, - "real_time": 1.8986855991902659e+06, - "cpu_time": 2.2651512291105674e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5226415602835310e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 371, - "real_time": 1.8920125546450964e+06, - "cpu_time": 2.2610162210243912e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5421196726503313e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 371, - "real_time": 1.8979925368102947e+06, - "cpu_time": 2.2651656765500437e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5246581831254363e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 371, - "real_time": 1.8919978990229573e+06, - "cpu_time": 2.2620871509434925e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5421626025139499e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 371, - "real_time": 1.9001647856838328e+06, - "cpu_time": 2.2663612614556681e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5183424506135011e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8961706750704895e+06, - "cpu_time": 2.2639563078168328e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5299848938373494e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time_median", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8979925368102945e+06, - "cpu_time": 2.2651512291105678e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5246581831254363e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8826205239264664e+03, - "cpu_time": 2.2810123519687595e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1329103278900762e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0476113120893673e-03, - "cpu_time": 1.0075337337973516e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0486680337094567e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 362, - "real_time": 1.9381477002913740e+06, - "cpu_time": 2.4480741685083662e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0820393098445086e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 362, - "real_time": 1.9404009619382988e+06, - "cpu_time": 2.4537307762432257e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0807828078507650e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 362, - "real_time": 1.9390511257993316e+06, - "cpu_time": 2.4527986961326976e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0815351756831553e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 362, - "real_time": 1.9397583170420907e+06, - "cpu_time": 2.4530312872928297e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0811408728474569e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 362, - "real_time": 1.9400606373420181e+06, - "cpu_time": 2.4536408867401308e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0809723983025630e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9394837484826227e+06, - "cpu_time": 2.4522551629834501e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0812941129056897e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time_median", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9397583170420907e+06, - "cpu_time": 2.4530312872928297e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0811408728474569e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9744865129603602e+02, - "cpu_time": 2.3704523220041583e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0046113775197370e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6272553301782772e-04, - "cpu_time": 9.6664179070184153e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6283534866116839e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 356, - "real_time": 1.9720594256101281e+06, - "cpu_time": 2.7933543960671797e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1268649136687856e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 356, - "real_time": 1.9693609274429365e+06, - "cpu_time": 2.7927845646066605e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1297792301820374e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 356, - "real_time": 1.9679703976006738e+06, - "cpu_time": 2.7918885589886950e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1312840910176523e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 356, - "real_time": 1.9671749039108371e+06, - "cpu_time": 2.7928226966292039e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1321459478064325e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 356, - "real_time": 1.9659798695663973e+06, - "cpu_time": 2.7916791460676338e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1334419873409314e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9685091048261947e+06, - "cpu_time": 2.7925058724718746e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1307032340031679e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time_median", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9679703976006738e+06, - "cpu_time": 2.7927845646066600e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1312840910176523e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3344007791938338e+03, - "cpu_time": 7.0046263689235286e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5251769188870708e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1858724826167085e-03, - "cpu_time": 2.5083658508918950e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1851377885895285e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 349, - "real_time": 2.0109855127587572e+06, - "cpu_time": 3.5154923810890336e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1713915623848243e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 349, - "real_time": 2.0026650348475424e+06, - "cpu_time": 3.5121190830945293e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1887224543462424e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 349, - "real_time": 2.0099017391499016e+06, - "cpu_time": 3.5158403667619727e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1736408485063581e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 349, - "real_time": 2.0058100621474849e+06, - "cpu_time": 3.5120531747849747e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1821547106104784e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 349, - "real_time": 2.0267462616727652e+06, - "cpu_time": 3.5337924212032435e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1389532368380947e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0112217221152901e+06, - "cpu_time": 3.5178594853867507e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1709725625371995e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time_median", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0099017391499013e+06, - "cpu_time": 3.5154923810890340e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1736408485063581e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2912921459366971e+03, - "cpu_time": 9.0857570928348632e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9187441360723425e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6197254354257058e-03, - "cpu_time": 2.5827515654270037e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6002319778032097e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 197, - "real_time": 3.5496114701183918e+06, - "cpu_time": 6.4839768730967157e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7264936292986517e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 197, - "real_time": 3.5474088402266428e+06, - "cpu_time": 6.4843571827412024e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7294283674751482e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 197, - "real_time": 3.5486847556995107e+06, - "cpu_time": 6.4880827055834942e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7277279203384476e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 197, - "real_time": 3.5473998839290915e+06, - "cpu_time": 6.4808901218276070e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7294403080990114e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 197, - "real_time": 3.5477784157347707e+06, - "cpu_time": 6.4784649086296037e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7289356983489389e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5481766731416816e+06, - "cpu_time": 6.4831543583757244e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7284051847120390e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time_median", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5477784157347707e+06, - "cpu_time": 6.4839768730967157e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7289356983489389e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5764921617392099e+02, - "cpu_time": 3.6581972741932159e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2759858216140177e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6989896625581063e-04, - "cpu_time": 5.6426194287154563e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6985543153948757e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 99, - "real_time": 7.1646357566645052e+06, - "cpu_time": 1.3405315373736840e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6833409456702461e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 99, - "real_time": 7.1491836382057332e+06, - "cpu_time": 1.3369780707069946e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6934634355568638e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 99, - "real_time": 7.1607197898280136e+06, - "cpu_time": 1.3395559787878400e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6859021138719788e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 99, - "real_time": 7.1520005644421382e+06, - "cpu_time": 1.3374278545454374e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6916148422615891e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 99, - "real_time": 7.1636240769441081e+06, - "cpu_time": 1.3402284828283321e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6840023484752436e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1580327652169000e+06, - "cpu_time": 1.3389443848484578e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6876647371671848e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time_median", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1607197898280146e+06, - "cpu_time": 1.3395559787878400e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6859021138719788e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0138587671925925e+03, - "cpu_time": 1.6361741479303208e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5946528147750180e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.7985843279107436e-04, - "cpu_time": 1.2219881321773522e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.8015815387676904e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 50, - "real_time": 1.4220062084496021e+07, - "cpu_time": 2.6268008720001034e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7193087907237806e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 50, - "real_time": 1.4253691025078297e+07, - "cpu_time": 2.6289347119998183e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7081744568425827e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 50, - "real_time": 1.4217114988714457e+07, - "cpu_time": 2.6305320740000296e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7202870662065411e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 50, - "real_time": 1.4253707099705935e+07, - "cpu_time": 2.6343873260000240e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7081691471957150e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 50, - "real_time": 1.4230644721537828e+07, - "cpu_time": 2.6305629900000438e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7157992707408342e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4235043983906511e+07, - "cpu_time": 2.6302435948000040e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7143477463418913e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time_median", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4230644721537832e+07, - "cpu_time": 2.6305320740000300e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7157992707408342e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7757278252070584e+04, - "cpu_time": 2.7803442346793105e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8796044841128560e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2474340277519446e-03, - "cpu_time": 1.0570672009908343e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2471724192758475e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 26, - "real_time": 2.7305466409486074e+07, - "cpu_time": 4.8998865576921754e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9154160557891808e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 26, - "real_time": 2.7396002282889988e+07, - "cpu_time": 4.9097953076922685e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8991720256872988e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 26, - "real_time": 2.7419442454209693e+07, - "cpu_time": 4.9204395115387239e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8949838503880157e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 26, - "real_time": 2.7384463697671890e+07, - "cpu_time": 4.9153214076922655e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9012363171242466e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 26, - "real_time": 2.7393306892078657e+07, - "cpu_time": 4.9102060423076816e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8996540844366560e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7379736347267263e+07, - "cpu_time": 4.9111297653846227e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9020924666850796e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time_median", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7393306892078657e+07, - "cpu_time": 4.9102060423076816e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8996540844366560e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3484729434165267e+04, - "cpu_time": 7.6368350701157528e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7983672639444210e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5882084795351005e-03, - "cpu_time": 1.5550057593555892e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5908241872103805e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.3086633235216141e+07, - "cpu_time": 9.1993131100002751e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0565545343705778e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.3266233205795288e+07, - "cpu_time": 9.2122951600003943e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0395051394547386e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.3215737640857697e+07, - "cpu_time": 9.2416827200008810e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0442870455280895e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.3153721615672112e+07, - "cpu_time": 9.2045481299999207e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0501723649930305e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.3138089179992676e+07, - "cpu_time": 9.2040618199996516e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0516580506073256e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3172082975506783e+07, - "cpu_time": 9.2123801880002245e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0484354269907522e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time_median", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3153721615672112e+07, - "cpu_time": 9.2045481299999207e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0501723649930305e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9936348656208502e+04, - "cpu_time": 1.7028876339358985e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6385477609971296e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3152832227472451e-03, - "cpu_time": 1.8484773741253423e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3149713127962506e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.0422693565487862e+08, - "cpu_time": 1.7837412900000516e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1509804891291590e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 1.0451261885464191e+08, - "cpu_time": 1.7852095075001273e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1369003846960335e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.0438843816518784e+08, - "cpu_time": 1.7836315824999359e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1430112514035044e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 1.0440433677285910e+08, - "cpu_time": 1.7841464624999049e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1422280778241072e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.0454489849507809e+08, - "cpu_time": 1.7831009262499720e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1353142977634201e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0441544558852911e+08, - "cpu_time": 1.7839659537499985e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1416869001632452e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time_median", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0440433677285910e+08, - "cpu_time": 1.7837412900000516e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1422280778241072e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2508946843038130e+05, - "cpu_time": 7.8891695427967905e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1631641020761402e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1979977456910206e-03, - "cpu_time": 4.4222646324686317e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1986657728770811e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.7617597430944443e+08, - "cpu_time": 3.0971456175001323e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0947119958254089e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.7633265629410744e+08, - "cpu_time": 3.0959061174999648e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0892964840788918e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.7621233314275742e+08, - "cpu_time": 3.0941087449997437e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0934544412967634e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.7673009634017944e+08, - "cpu_time": 3.1005951925001794e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0756025500784254e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.7635421082377434e+08, - "cpu_time": 3.1076009124998903e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0885522323760061e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7636105418205261e+08, - "cpu_time": 3.0990713169999826e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0883235407311001e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time_median", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7633265629410744e+08, - "cpu_time": 3.0971456175001323e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0892964840788918e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1989650568382433e+05, - "cpu_time": 5.3251789459306828e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5822328648386952e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2468541124551868e-03, - "cpu_time": 1.7183144242984560e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2453728541384650e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8662308527464073e+06, - "cpu_time": 2.0674684682539222e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1947981376324319e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8618054294998131e+06, - "cpu_time": 2.0675782222221121e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2000150687606591e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8671303258559890e+06, - "cpu_time": 2.0680800105818766e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1937408135247235e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8640767711552880e+06, - "cpu_time": 2.0691741269840670e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1973343927575718e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8638012103716999e+06, - "cpu_time": 2.0696458862432707e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1976592660239395e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8646089179258395e+06, - "cpu_time": 2.0683893428570498e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1967095357398652e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time_median", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8640767711552877e+06, - "cpu_time": 2.0680800105818764e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1973343927575718e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1085118889875221e+03, - "cpu_time": 9.7421770941350883e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4842371453498431e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1308065024879300e-03, - "cpu_time": 4.7100305983390416e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1308901358745807e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8662278972062275e+06, - "cpu_time": 2.0686537566138376e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3896032270568628e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8714782807499568e+06, - "cpu_time": 2.0732478015874962e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3772883096015537e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8663637692471547e+06, - "cpu_time": 2.0687028730159390e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3892836621579146e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8616721011567665e+06, - "cpu_time": 2.0686691851851142e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4003452567774039e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8667989085659706e+06, - "cpu_time": 2.0687109285714184e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3882605471913917e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8665081913852151e+06, - "cpu_time": 2.0695969089947611e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3889562005570261e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time_median", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8663637692471545e+06, - "cpu_time": 2.0687028730159388e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3892836621579146e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4739565357941874e+03, - "cpu_time": 2.0410466829446518e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1679264337139139e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8612061558733457e-03, - "cpu_time": 9.8620493395306795e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8610179870733909e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 381, - "real_time": 1.8676533394123751e+06, - "cpu_time": 2.0712771443567628e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7725059325811192e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 381, - "real_time": 1.8629079086573434e+06, - "cpu_time": 2.0710637007874332e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7948523509186599e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 381, - "real_time": 1.8679426849778164e+06, - "cpu_time": 2.0711348845145104e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7711470655720755e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 381, - "real_time": 1.8736901009182464e+06, - "cpu_time": 2.0773768057744096e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7442421732231118e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 381, - "real_time": 1.8676650769642817e+06, - "cpu_time": 2.0710995905512171e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7724508007777762e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8679718221860125e+06, - "cpu_time": 2.0723904251968667e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7710396646145489e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time_median", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8676650769642820e+06, - "cpu_time": 2.0711348845145106e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7724508007777762e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8255164609241656e+03, - "cpu_time": 2.7886475057199764e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7953428334578435e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0479519099208449e-03, - "cpu_time": 1.3456187945160329e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0468985457914256e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 373, - "real_time": 1.8709001957498812e+06, - "cpu_time": 2.0760950134046953e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7514563350006044e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 373, - "real_time": 1.8662455849355427e+06, - "cpu_time": 2.0769454557639326e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7558246494730089e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 373, - "real_time": 1.8708928955260704e+06, - "cpu_time": 2.0765002493297546e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7514631691829730e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 373, - "real_time": 1.8663609819549159e+06, - "cpu_time": 2.0765049517425743e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7557160869103268e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 373, - "real_time": 1.8709726778447977e+06, - "cpu_time": 2.0764127426274165e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7513884830079917e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8690744672022418e+06, - "cpu_time": 2.0764916825736747e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7531697447149809e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time_median", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8708928955260706e+06, - "cpu_time": 2.0765002493297546e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7514631691829730e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5302542859802516e+03, - "cpu_time": 3.0403022509686804e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3745233214071093e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3537471782853621e-03, - "cpu_time": 1.4641533488833560e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3544172368735144e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8780822733462546e+06, - "cpu_time": 2.0901844827586075e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4895169892228350e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8782299668518878e+06, - "cpu_time": 2.0899375490718489e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4892425931125611e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8717068371902448e+06, - "cpu_time": 2.0831794297081535e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5014030348032951e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8676304325105657e+06, - "cpu_time": 2.0845208355439203e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5090454117254399e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8725743517588419e+06, - "cpu_time": 2.0847399204245056e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4997809266395420e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8736447723315593e+06, - "cpu_time": 2.0865124435014073e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4977977911007345e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time_median", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8725743517588419e+06, - "cpu_time": 2.0847399204245056e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4997809266395420e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5218663275038261e+03, - "cpu_time": 3.2951684985784727e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4439722702055340e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4134064227536718e-03, - "cpu_time": 1.5792709546696023e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4140824525903399e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8806865100486903e+06, - "cpu_time": 2.1038978563829102e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9693699242095694e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8702115833141934e+06, - "cpu_time": 2.0973138776593683e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0084048868806541e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8705575296328962e+06, - "cpu_time": 2.0976361329787248e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0071087322143659e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8745201083375118e+06, - "cpu_time": 2.0976538537231614e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9922962905021116e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8709324330631443e+06, - "cpu_time": 2.0976617686171308e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0057046253351405e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8733816328792870e+06, - "cpu_time": 2.0988326978722597e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9965768918283686e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time_median", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8709324330631446e+06, - "cpu_time": 2.0976538537231619e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0057046253351405e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4351073819486492e+03, - "cpu_time": 2.8352760873188727e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6527849848815787e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3674340049614591e-03, - "cpu_time": 1.3508823691346147e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3622765967339599e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 375, - "real_time": 1.8756399760022762e+06, - "cpu_time": 2.1213301679999861e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3976242954617101e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 375, - "real_time": 1.8765142098612462e+06, - "cpu_time": 2.1216119759998643e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3969731677085650e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 375, - "real_time": 1.8768338005368907e+06, - "cpu_time": 2.1216219146666238e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3967352885748890e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 375, - "real_time": 1.8762966092132654e+06, - "cpu_time": 2.1214767626667405e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3971351795488107e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 375, - "real_time": 1.8760785869865990e+06, - "cpu_time": 2.1213533039999674e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3972975429620025e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8762726365200556e+06, - "cpu_time": 2.1214788250666363e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3971530948511955e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time_median", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8762966092132654e+06, - "cpu_time": 2.1214767626667405e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3971351795488107e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5048639692775453e+02, - "cpu_time": 1.3789717383492322e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3546687317826181e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4009644875665656e-04, - "cpu_time": 6.5000495034680275e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4010745451914192e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 371, - "real_time": 1.8994800491174408e+06, - "cpu_time": 2.1811311940699904e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7601658687786746e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 371, - "real_time": 1.8973413484096981e+06, - "cpu_time": 2.1788452884097467e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7632771532620871e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 371, - "real_time": 1.8974603317719395e+06, - "cpu_time": 2.1791337277627243e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7631038774359763e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 371, - "real_time": 1.8975530885821434e+06, - "cpu_time": 2.1792610269540213e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7629688104892462e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 371, - "real_time": 1.9001808120100948e+06, - "cpu_time": 2.1819505471697543e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7591479541643465e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8984031259782636e+06, - "cpu_time": 2.1800643568732473e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7617327328260660e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time_median", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8975530885821437e+06, - "cpu_time": 2.1792610269540213e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7629688104892462e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3284132610361219e+03, - "cpu_time": 1.3868483020892795e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9319228561202955e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.9975298863437097e-04, - "cpu_time": 6.3615016580444595e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9953288135284888e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 372, - "real_time": 1.8923901844837314e+06, - "cpu_time": 2.2600984408601588e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5410137327787149e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 372, - "real_time": 1.8986783983838065e+06, - "cpu_time": 2.2637749623654406e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5226625051012814e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 372, - "real_time": 1.8931493139325050e+06, - "cpu_time": 2.2607742768817237e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5387918548372042e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 372, - "real_time": 1.8989196677300427e+06, - "cpu_time": 2.2640923897849964e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5219608170863879e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 372, - "real_time": 1.8932727931921058e+06, - "cpu_time": 2.2605182043011403e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5384306148089433e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8952820715444386e+06, - "cpu_time": 2.2618516548386919e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5325719049225068e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time_median", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8932727931921061e+06, - "cpu_time": 2.2607742768817237e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5384306148089433e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2293965112130836e+03, - "cpu_time": 1.9191533154972756e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4216254686757736e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7039133961635031e-03, - "cpu_time": 8.4848770315758986e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7029377350329692e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 363, - "real_time": 1.9410442592660813e+06, - "cpu_time": 2.4531829834708604e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0804246167951596e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 363, - "real_time": 1.9418270459922017e+06, - "cpu_time": 2.4534328732783222e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0799890774661825e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 363, - "real_time": 1.9424225478856398e+06, - "cpu_time": 2.4535437410467044e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0796579777570980e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 363, - "real_time": 1.9406616553399947e+06, - "cpu_time": 2.4530542286501341e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0806376238894610e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 363, - "real_time": 1.9443835529175487e+06, - "cpu_time": 2.4575433168043052e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0785690903696558e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9420678122802936e+06, - "cpu_time": 2.4541514286500653e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0798556772555115e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time_median", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9418270459922017e+06, - "cpu_time": 2.4534328732783222e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0799890774661825e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4638475473410804e+03, - "cpu_time": 1.9060591017211730e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1352923409057653e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.5375717474164452e-04, - "cpu_time": 7.7666727467164609e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5336848360902048e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 355, - "real_time": 1.9729406753240128e+06, - "cpu_time": 2.7929141690143473e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1259149109038348e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 355, - "real_time": 1.9712613331495037e+06, - "cpu_time": 2.7921048478873046e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1277260043947189e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 355, - "real_time": 1.9710742661886860e+06, - "cpu_time": 2.7928573887323528e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1279279385602255e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 355, - "real_time": 1.9708106254922673e+06, - "cpu_time": 2.7919186676056813e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1282125972668483e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 355, - "real_time": 1.9728946771708804e+06, - "cpu_time": 2.7910574478873587e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1259644767325380e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9717963154650703e+06, - "cpu_time": 2.7921705042254091e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1271491855716333e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time_median", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9712613331495035e+06, - "cpu_time": 2.7921048478873046e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1277260043947189e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0362316197282794e+03, - "cpu_time": 7.6345833088098777e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1176973644059468e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.2552670455917382e-04, - "cpu_time": 2.7342826296805357e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2544380619245828e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 348, - "real_time": 2.0123664681109246e+06, - "cpu_time": 3.5156520028736517e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1685290094674783e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 348, - "real_time": 2.0093071122584199e+06, - "cpu_time": 3.5129549597701863e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1748759802932148e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 348, - "real_time": 2.0174142940039476e+06, - "cpu_time": 3.5173984683905314e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1580988223054519e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 348, - "real_time": 2.0106216389471772e+06, - "cpu_time": 3.5142273505749502e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1721464832103024e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 348, - "real_time": 2.0153531329652786e+06, - "cpu_time": 3.5181437155173146e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1623514325042720e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0130125292571497e+06, - "cpu_time": 3.5156752994253272e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1672003455561442e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time_median", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0123664681109246e+06, - "cpu_time": 3.5156520028736517e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1685290094674783e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3435693957993049e+03, - "cpu_time": 2.1540505863707522e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9190800933072018e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6609779359064211e-03, - "cpu_time": 6.1269895622125686e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6603665577743655e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 197, - "real_time": 3.5519911233940856e+06, - "cpu_time": 6.4838025837559877e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7233271191197748e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 197, - "real_time": 3.5451979631662066e+06, - "cpu_time": 6.4720434670048486e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7323777612171240e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 197, - "real_time": 3.5476824528712607e+06, - "cpu_time": 6.4710993553304151e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7290636134645100e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 197, - "real_time": 3.5471423543271073e+06, - "cpu_time": 6.4738581878167782e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7297836748879614e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 197, - "real_time": 3.5487333794838279e+06, - "cpu_time": 6.4732931218275344e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7276631422900209e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5481494546484975e+06, - "cpu_time": 6.4748193431471130e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7284430621958780e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time_median", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5476824528712607e+06, - "cpu_time": 6.4732931218275335e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7290636134645100e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5021506070516216e+03, - "cpu_time": 5.1355520792510488e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3333665899567660e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.0519876319570106e-04, - "cpu_time": 7.9315758588484309e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0496071246097620e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 100, - "real_time": 7.1427542902529240e+06, - "cpu_time": 1.3261001459999306e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6976881237240267e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 100, - "real_time": 7.1469335211440921e+06, - "cpu_time": 1.3247606319999931e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6949411101600056e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 100, - "real_time": 7.1517271408811212e+06, - "cpu_time": 1.3282232709999561e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6917942112464266e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 100, - "real_time": 7.1523991553112864e+06, - "cpu_time": 1.3298100669999259e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6913533866580811e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 100, - "real_time": 7.1424279222264886e+06, - "cpu_time": 1.3263534919999529e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6979027811512270e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1472484059631824e+06, - "cpu_time": 1.3270495215999519e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6947359225879536e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time_median", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1469335211440939e+06, - "cpu_time": 1.3263534919999529e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6949411101600056e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7466455848916657e+03, - "cpu_time": 1.9763024435266201e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1177636842839774e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.6412209500531488e-04, - "cpu_time": 1.4892454361039211e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6409777582661627e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 50, - "real_time": 1.4288020543754101e+07, - "cpu_time": 2.6407726299999014e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6968622276607885e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 50, - "real_time": 1.4280122853815556e+07, - "cpu_time": 2.6429211600000143e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6994598496797209e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 50, - "real_time": 1.4259607717394829e+07, - "cpu_time": 2.6383650479999684e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7062209094389105e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 50, - "real_time": 1.4290106948465109e+07, - "cpu_time": 2.6391372999999024e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6961764696385365e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 50, - "real_time": 1.4307553451508284e+07, - "cpu_time": 2.6420818880001206e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6904499939453640e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4285082302987579e+07, - "cpu_time": 2.6406556051999815e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6978338900726643e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time_median", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4288020543754101e+07, - "cpu_time": 2.6407726299999014e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6968622276607885e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7409648789022576e+04, - "cpu_time": 1.9191546938628886e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7271050894217053e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2187293303435520e-03, - "cpu_time": 7.2677205239626375e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2190948474198012e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 26, - "real_time": 2.7400063350796700e+07, - "cpu_time": 4.9284043038465619e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8984459007134895e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 26, - "real_time": 2.7396457413068183e+07, - "cpu_time": 4.9244612538455635e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8990906370243979e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 26, - "real_time": 2.7384765374545868e+07, - "cpu_time": 4.9223097884613223e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9011823239776716e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 26, - "real_time": 2.7367841667280748e+07, - "cpu_time": 4.9279446307694420e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9042131137605267e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 26, - "real_time": 2.7417331145933039e+07, - "cpu_time": 4.9396710576930813e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8953607951702194e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7393291790324915e+07, - "cpu_time": 4.9285582069231942e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8996585541292620e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time_median", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7396457413068186e+07, - "cpu_time": 4.9279446307694413e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8990906370243979e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8399553968638567e+04, - "cpu_time": 6.7030472896388586e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2912641246062280e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.7168101261700633e-04, - "cpu_time": 1.3600422290281613e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7173336432443129e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.3139927610754967e+07, - "cpu_time": 9.2058440599998906e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0514832832717571e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.3062470629811287e+07, - "cpu_time": 9.1879854400008291e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0588570945505304e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.3090519085526466e+07, - "cpu_time": 9.1986109799995571e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0561844303605776e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.3248919546604156e+07, - "cpu_time": 9.2517094300001189e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0411437130674877e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.3219959884881973e+07, - "cpu_time": 9.2577525600017905e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0438868533655853e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3152359351515777e+07, - "cpu_time": 9.2203804940004379e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0503110749231873e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time_median", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3139927610754967e+07, - "cpu_time": 9.2058440599998906e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0514832832717571e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0548824248155957e+04, - "cpu_time": 3.2065685416815226e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.6520581220165864e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5154327151398388e-03, - "cpu_time": 3.4776965481717248e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5151657013786957e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.0440095234662294e+08, - "cpu_time": 1.7829078012499622e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1423947764147587e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 1.0444433242082596e+08, - "cpu_time": 1.7837555662498516e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1402589260357914e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.0448521282523870e+08, - "cpu_time": 1.7849422300000128e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1382477719403877e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 1.0460723377764225e+08, - "cpu_time": 1.7839600000002065e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1322541722228928e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.0450225602835417e+08, - "cpu_time": 1.7875780637498906e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1374097785442352e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0448799747973680e+08, - "cpu_time": 1.7846287322499847e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1381130850316133e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time_median", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0448521282523870e+08, - "cpu_time": 1.7839600000002065e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1382477719403877e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7317281093847225e+04, - "cpu_time": 1.8005597968991913e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8005642541917376e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.3996327768499203e-04, - "cpu_time": 1.0089268229079339e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3968092786115742e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.7942670360207558e+08, - "cpu_time": 3.0796398924996990e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9842922064783401e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.7946901917457581e+08, - "cpu_time": 3.0724668325001401e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9828812178191805e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.7971289530396461e+08, - "cpu_time": 3.0775671275000602e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9747622572319241e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.7959230020642281e+08, - "cpu_time": 3.0652552250001007e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9787742724261818e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.7940849438309669e+08, - "cpu_time": 3.0800912149999249e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9848995873473234e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7952188253402713e+08, - "cpu_time": 3.0750040584999859e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9811219082605896e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time_median", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7946901917457581e+08, - "cpu_time": 3.0775671275000608e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9828812178191805e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2860303601241519e+05, - "cpu_time": 6.2333119448830909e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2829130106318993e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipManaged_HostToGPUWriteDst/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.1636412339893651e-04, - "cpu_time": 2.0270906399791084e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1607184677455302e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - } - ] -} diff --git a/results/hipMemcpyAsync_GPUToGPU.json b/results/hipMemcpyAsync_GPUToGPU.json deleted file mode 100644 index 48c81a4..0000000 --- a/results/hipMemcpyAsync_GPUToGPU.json +++ /dev/null @@ -1,2030 +0,0 @@ -{ - "context": { - "date": "2023-10-09T16:55:39-04:00", - "host_name": "frontier10485", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1798, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [2.22,9.02,32.42], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 100226, - "real_time": 6.9836825848939588e+03, - "cpu_time": 1.7107840925828562e+09, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6656877927662447e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 100226, - "real_time": 6.9830192688770348e+03, - "cpu_time": 1.7051092855150082e+09, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6660359959334366e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 100226, - "real_time": 6.9862540304095701e+03, - "cpu_time": 1.7117225139865437e+09, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6643385551926740e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 100226, - "real_time": 6.9794356667886459e+03, - "cpu_time": 1.7080383822809827e+09, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6679183278121658e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 100226, - "real_time": 6.9619454732814274e+03, - "cpu_time": 1.7061017414887834e+09, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6771330798621945e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9788674048501271e+03, - "cpu_time": 1.7083512031708350e+09, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6682227503133431e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9830192688770348e+03, - "cpu_time": 1.7080383822809827e+09, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6660359959334366e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7680712088385828e+00, - "cpu_time": 2.8702200423025452e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1425072180309093e+04, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3996642495385475e-03, - "cpu_time": 1.6801112306270456e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4019070182124658e-03, - "dst_id": NaN, - "src_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 99149, - "real_time": 7.0545073947904903e+03, - "cpu_time": 1.6932919841619306e+09, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.2577711149341807e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 99149, - "real_time": 7.0547944566138613e+03, - "cpu_time": 1.6911176557559247e+09, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.2574757939262241e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 99149, - "real_time": 7.0709511069137598e+03, - "cpu_time": 1.7025135321805902e+09, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.2408929471932292e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 99149, - "real_time": 7.0521106007904345e+03, - "cpu_time": 1.6917240978340182e+09, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.2602378065739989e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 99149, - "real_time": 7.0382274805403767e+03, - "cpu_time": 1.6937662259639750e+09, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.2745588490227371e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0541182079297851e+03, - "cpu_time": 1.6944826991792874e+09, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.2581873023300752e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0545073947904893e+03, - "cpu_time": 1.6932919841619306e+09, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.2577711149341807e+07, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1624338370938759e+01, - "cpu_time": 4.6194916776733939e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1958326434957360e+05, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6478797247643832e-03, - "cpu_time": 2.7261958354079488e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6475637699675252e-03, - "dst_id": NaN, - "src_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 97395, - "real_time": 7.1555680512686249e+03, - "cpu_time": 1.6689031021438215e+09, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4310534015792820e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 97395, - "real_time": 7.2052801918498653e+03, - "cpu_time": 1.6674288520265851e+09, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4211799856975457e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 97395, - "real_time": 7.1499441040749571e+03, - "cpu_time": 1.6711552149299939e+09, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4321790283876392e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 97395, - "real_time": 7.2159938302655746e+03, - "cpu_time": 1.6692803941933672e+09, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4190699494574165e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 97395, - "real_time": 7.1633472900534416e+03, - "cpu_time": 1.6692657088893404e+09, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4294993088243255e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1780266935024920e+03, - "cpu_time": 1.6692066544366217e+09, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4265963347892419e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1633472900534425e+03, - "cpu_time": 1.6692657088893406e+09, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4294993088243255e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0384058203793124e+01, - "cpu_time": 1.3283954962595555e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0299768672441854e+05, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2329263321487214e-03, - "cpu_time": 7.9582446710764259e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2268276738107726e-03, - "dst_id": NaN, - "src_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 87780, - "real_time": 8.0468166390487931e+03, - "cpu_time": 1.5449767433568487e+09, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5451058373340696e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 87780, - "real_time": 8.0393473498153344e+03, - "cpu_time": 1.5419386367218740e+09, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5474704735167873e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 87780, - "real_time": 7.9298600164472673e+03, - "cpu_time": 1.5421661454372964e+09, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5826433199984077e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 87780, - "real_time": 7.8580772127174878e+03, - "cpu_time": 1.5359045213303261e+09, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6062355262754649e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 87780, - "real_time": 7.9385118640028104e+03, - "cpu_time": 1.5405967149218662e+09, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5798286065259385e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9625226164063379e+03, - "cpu_time": 1.5411165523536425e+09, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5722567527301335e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9385118640028104e+03, - "cpu_time": 1.5419386367218738e+09, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5798286065259385e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9937047004715879e+01, - "cpu_time": 3.3209201010083100e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5842323063416723e+06, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0039161061848665e-02, - "cpu_time": 2.1548792633084724e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0046556602869555e-02, - "dst_id": NaN, - "src_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 73315, - "real_time": 9.6020587579502226e+03, - "cpu_time": 1.3467827549828765e+09, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.2657518593172860e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 73315, - "real_time": 9.5627617457190627e+03, - "cpu_time": 1.3419919216124077e+09, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.2832814503965294e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 73315, - "real_time": 9.6089469410885304e+03, - "cpu_time": 1.3490836786921635e+09, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.2626939508690768e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 73315, - "real_time": 9.4972042395639619e+03, - "cpu_time": 1.3429542810245609e+09, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.3128481779265773e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 73315, - "real_time": 9.5776723234797828e+03, - "cpu_time": 1.3464799996685064e+09, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.2766132121252519e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5697288015603135e+03, - "cpu_time": 1.3454585271961033e+09, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.2802377301269442e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5776723234797846e+03, - "cpu_time": 1.3464799996685064e+09, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.2766132121252519e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4594674706124771e+01, - "cpu_time": 2.9252056240650211e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0021658980214403e+06, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6599726732960032e-03, - "cpu_time": 2.1741328810491582e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6776978856313657e-03, - "dst_id": NaN, - "src_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 64940, - "real_time": 1.0778903203872545e+04, - "cpu_time": 1.2310589817732868e+09, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6000311395846415e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 64940, - "real_time": 1.0779383659210189e+04, - "cpu_time": 1.2269964574901321e+09, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.5996923933591878e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 64940, - "real_time": 1.0782155879800906e+04, - "cpu_time": 1.2329084578210638e+09, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.5977384220040298e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 64940, - "real_time": 1.0781170600983934e+04, - "cpu_time": 1.2301290097320161e+09, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.5984327706050432e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 64940, - "real_time": 1.0781205759214461e+04, - "cpu_time": 1.2315244851459081e+09, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.5984079916093576e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0780563820616408e+04, - "cpu_time": 1.2305234783924816e+09, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.5988605434324539e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0781170600983936e+04, - "cpu_time": 1.2310589817732871e+09, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.5984327706050432e+08, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3661395342325611e+00, - "cpu_time": 2.2120345405619568e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6296660793612158e+04, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2672245691083421e-04, - "cpu_time": 1.7976370052294260e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2672513233163554e-04, - "dst_id": NaN, - "src_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 64656, - "real_time": 1.0832138033460400e+04, - "cpu_time": 1.2431032687248352e+09, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5125361170057042e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 64656, - "real_time": 1.0830693529977310e+04, - "cpu_time": 1.2387432429080260e+09, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5127378458869865e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 64656, - "real_time": 1.0830321281895463e+04, - "cpu_time": 1.2442221486928854e+09, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5127898400750453e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 64656, - "real_time": 1.0827312796477241e+04, - "cpu_time": 1.2417237969062314e+09, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5132101850175304e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 64656, - "real_time": 1.0828037600735866e+04, - "cpu_time": 1.2438982451700900e+09, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5131088941625540e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0829700648509257e+04, - "cpu_time": 1.2423381404804139e+09, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5128765764295642e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0830321281895463e+04, - "cpu_time": 1.2431032687248349e+09, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5127898400750453e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9861652759622803e+00, - "cpu_time": 2.2287631883863066e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7746540137465787e+05, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8339983166900208e-04, - "cpu_time": 1.7940068937466903e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8340253639823338e-04, - "dst_id": NaN, - "src_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 64419, - "real_time": 1.0868259237274131e+04, - "cpu_time": 1.2606583302180681e+09, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0150182549582376e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 64419, - "real_time": 1.0866791549393767e+04, - "cpu_time": 1.2587995583388405e+09, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0154254685991511e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 64419, - "real_time": 1.0864623350506747e+04, - "cpu_time": 1.2623556426605194e+09, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0160272420738487e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 64419, - "real_time": 1.0861309877599266e+04, - "cpu_time": 1.2581063169595368e+09, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0169473451431336e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 64419, - "real_time": 1.0869310089426473e+04, - "cpu_time": 1.2591645842508390e+09, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0147267609814806e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0866058820840079e+04, - "cpu_time": 1.2598168864855609e+09, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0156290143511705e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0866791549393769e+04, - "cpu_time": 1.2591645842508390e+09, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0154254685991511e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1844351093711203e+00, - "cpu_time": 1.6985150378679405e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8389768240447377e+05, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9306256867151073e-04, - "cpu_time": 1.3482237427426382e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9310557704481074e-04, - "dst_id": NaN, - "src_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 61528, - "real_time": 1.1378530874150587e+04, - "cpu_time": 1.2578314695076354e+09, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.7596187701949091e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 61528, - "real_time": 1.1379771624404220e+04, - "cpu_time": 1.2545871872119167e+09, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.7589907919994040e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 61528, - "real_time": 1.1378668726056181e+04, - "cpu_time": 1.2596279300975156e+09, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.7595489927506332e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 61528, - "real_time": 1.1375746122274115e+04, - "cpu_time": 1.2561463415096574e+09, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.7610287092886314e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 61528, - "real_time": 1.1377979823567852e+04, - "cpu_time": 1.2581617068367872e+09, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.7598977161351252e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1378139434090592e+04, - "cpu_time": 1.2572709270327027e+09, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.7598169960737410e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1378530874150587e+04, - "cpu_time": 1.2578314695076354e+09, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.7596187701949091e+09, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4875178470589203e+00, - "cpu_time": 1.9448850863483995e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5307653666808666e+05, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3073471771686120e-04, - "cpu_time": 1.5469100927502889e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3074660830047756e-04, - "dst_id": NaN, - "src_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 54402, - "real_time": 1.2872900352726867e+04, - "cpu_time": 1.2219873761305933e+09, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0182009990641699e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 54402, - "real_time": 1.2879271086145052e+04, - "cpu_time": 1.2196264720567129e+09, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0176973457838110e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 54402, - "real_time": 1.2870982533605329e+04, - "cpu_time": 1.2233144934491539e+09, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0183527143928539e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 54402, - "real_time": 1.2875723391814741e+04, - "cpu_time": 1.2204729408438971e+09, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0179777555902149e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 54402, - "real_time": 1.2879906117457107e+04, - "cpu_time": 1.2231645487905903e+09, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0176471692006222e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2875756696349821e+04, - "cpu_time": 1.2217131662541895e+09, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0179751968063345e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2875723391814743e+04, - "cpu_time": 1.2219873761305931e+09, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0179777555902149e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8897644258090316e+00, - "cpu_time": 1.6308282291616707e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0753700415006974e+06, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0209987013126387e-04, - "cpu_time": 1.3348699794746754e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0210657893718542e-04, - "dst_id": NaN, - "src_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 53657, - "real_time": 1.3047614560083683e+04, - "cpu_time": 1.2931754559897070e+09, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0091335377270580e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 53657, - "real_time": 1.3044742576471470e+04, - "cpu_time": 1.2893930209733064e+09, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0095758767430466e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 53657, - "real_time": 1.3045960553005478e+04, - "cpu_time": 1.2939173199679081e+09, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0093882618678337e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 53657, - "real_time": 1.3048622920946220e+04, - "cpu_time": 1.2909726480991273e+09, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0089782775406513e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 53657, - "real_time": 1.3046846124625206e+04, - "cpu_time": 1.2931760428601882e+09, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0092518720307243e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3046757347026414e+04, - "cpu_time": 1.2921268975780475e+09, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0092655651818630e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3046846124625206e+04, - "cpu_time": 1.2931754559897070e+09, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0092518720307243e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4930876292899358e+00, - "cpu_time": 1.8849513287840032e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2994601317004822e+06, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1444128142923091e-04, - "cpu_time": 1.4587973768808164e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1444281789064319e-04, - "dst_id": NaN, - "src_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 53054, - "real_time": 1.3195362925005311e+04, - "cpu_time": 1.2845629474138367e+09, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.9732745736494316e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 53054, - "real_time": 1.3191734740331931e+04, - "cpu_time": 1.2827732048927748e+09, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.9743673619896317e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 53054, - "real_time": 1.3196568726460369e+04, - "cpu_time": 1.2853985382903628e+09, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.9729115262269119e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 53054, - "real_time": 1.3197923345036001e+04, - "cpu_time": 1.2836313396672943e+09, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.9725037514875023e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 53054, - "real_time": 1.3199544885838070e+04, - "cpu_time": 1.2855353001063821e+09, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.9720157364100800e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3196226924534338e+04, - "cpu_time": 1.2843802660741305e+09, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.9730145899527115e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3196568726460368e+04, - "cpu_time": 1.2845629474138367e+09, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.9729115262269119e+10, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9550698976239578e+00, - "cpu_time": 1.1776980507759280e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8978511110042743e+06, - "dst_id": 0.0000000000000000e+00, - "src_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2393294041722726e-04, - "cpu_time": 9.1693876173892786e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2395717180364496e-04, - "dst_id": NaN, - "src_id": NaN - } \ No newline at end of file diff --git a/results/hipMemcpyAsync_GPUToPageable.json b/results/hipMemcpyAsync_GPUToPageable.json deleted file mode 100644 index c23588c..0000000 --- a/results/hipMemcpyAsync_GPUToPageable.json +++ /dev/null @@ -1,30584 +0,0 @@ -{ - "context": { - "date": "2023-10-09T14:56:12-04:00", - "host_name": "frontier10336", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1790, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [1.87,2.08,2.08], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 91522, - "real_time": 7.6305253585211722e+03, - "cpu_time": 1.4875198323900262e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3549459306117013e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 91522, - "real_time": 7.6738251164555459e+03, - "cpu_time": 1.4985112399204558e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3360155608842380e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 91522, - "real_time": 7.6504470728475280e+03, - "cpu_time": 1.4892168145363950e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3462096732696664e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 91522, - "real_time": 7.6815347266081344e+03, - "cpu_time": 1.5013827014269800e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3326673524398632e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 91522, - "real_time": 7.6722033634773961e+03, - "cpu_time": 1.4951677268853386e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3367207289975826e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6617071275819544e+03, - "cpu_time": 1.4943596630318392e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3413118492406100e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6722033634773952e+03, - "cpu_time": 1.4951677268853386e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3367207289975826e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0911969418699279e+01, - "cpu_time": 5.9254493501982736e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1341835356259398e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7294138330368582e-03, - "cpu_time": 3.9652096458334500e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7337117718305441e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 87428, - "real_time": 7.9979120342315464e+03, - "cpu_time": 1.5243032872763879e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4016708086886816e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 87428, - "real_time": 7.9701219159161456e+03, - "cpu_time": 1.5274028915221665e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4239920719098173e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 87428, - "real_time": 7.9684205580604503e+03, - "cpu_time": 1.5199398064693236e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4253636748889558e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 87428, - "real_time": 7.9890987669283804e+03, - "cpu_time": 1.5242810461179477e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4087328863609970e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 87428, - "real_time": 7.9966539117498005e+03, - "cpu_time": 1.5247373392963356e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4026779906993106e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9844414373772652e+03, - "cpu_time": 1.5241328741364327e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4124874865095526e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9890987669283813e+03, - "cpu_time": 1.5243032872763881e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4087328863609970e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4265425838162795e+01, - "cpu_time": 2.6782085366693146e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1461625776913151e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7866529487438648e-03, - "cpu_time": 1.7572014764045928e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7873915233403358e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 79849, - "real_time": 8.9583911031501884e+03, - "cpu_time": 1.6252476662199888e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1430623961482480e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 79849, - "real_time": 8.7998351470397320e+03, - "cpu_time": 1.6181916780423018e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1636581627832812e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 79849, - "real_time": 8.9674762848004375e+03, - "cpu_time": 1.6237615286352991e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1419043301353855e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 79849, - "real_time": 8.8528496797372936e+03, - "cpu_time": 1.6168986912797885e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1566896954590410e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 79849, - "real_time": 8.9806629129382691e+03, - "cpu_time": 1.6265585955991937e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1402276312194537e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9118430255331823e+03, - "cpu_time": 1.6221316319553142e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1491084431490821e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9583911031501866e+03, - "cpu_time": 1.6237615286352990e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1430623961482480e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0659685812863131e+01, - "cpu_time": 4.3264056900949313e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0446201189894343e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.0508422984747726e-03, - "cpu_time": 2.6671113520423066e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0907009274659757e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 72374, - "real_time": 9.6415522355703106e+03, - "cpu_time": 1.7027556014590853e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1241392982805926e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 72374, - "real_time": 9.6156648691108403e+03, - "cpu_time": 1.6996325572719499e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1298579223356172e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 72374, - "real_time": 9.6067817061605110e+03, - "cpu_time": 1.6928533699947504e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1318273513872865e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 72374, - "real_time": 9.6137390559957130e+03, - "cpu_time": 1.6965386298947127e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1302845730171371e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 72374, - "real_time": 9.6106851803181798e+03, - "cpu_time": 1.6889149832812887e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1309614887751395e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6176846094311113e+03, - "cpu_time": 1.6961390283803579e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1294141267591545e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6137390559957130e+03, - "cpu_time": 1.6965386298947127e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1302845730171371e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3758412227213833e+01, - "cpu_time": 5.4572393068733831e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0412344940829539e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4305326890967415e-03, - "cpu_time": 3.2174481074729458e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4282024599468293e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 69246, - "real_time": 1.0104454057865818e+04, - "cpu_time": 1.7425526080928856e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0536578983319408e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 69246, - "real_time": 1.0104571556107065e+04, - "cpu_time": 1.7472643445108679e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0536107614819491e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 69246, - "real_time": 1.0103635053447491e+04, - "cpu_time": 1.7442782673367437e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0539864893500793e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 69246, - "real_time": 1.0104333275640234e+04, - "cpu_time": 1.7511328611038909e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0537063537628293e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 69246, - "real_time": 1.0104066876504099e+04, - "cpu_time": 1.7489831325997198e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0538132319024915e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0104212163912942e+04, - "cpu_time": 1.7468422427288220e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0537549469658589e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0104333275640234e+04, - "cpu_time": 1.7472643445108675e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0537063537628293e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7299742516825857e-01, - "cpu_time": 3.4693630723370219e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4964806714421673e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.6915042867014796e-05, - "cpu_time": 1.9860769263956956e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6915913542387369e-05, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 62304, - "real_time": 1.1231232441453498e+04, - "cpu_time": 1.8999069610297978e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2939457381044340e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 62304, - "real_time": 1.1233429843685823e+04, - "cpu_time": 1.9006097923086782e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2925189492367077e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 62304, - "real_time": 1.1229049196356376e+04, - "cpu_time": 1.8982134293143299e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2953638876728368e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 62304, - "real_time": 1.1233984784087619e+04, - "cpu_time": 1.9051869751540915e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2921587107751477e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 62304, - "real_time": 1.1230876829419241e+04, - "cpu_time": 1.9025340475731951e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2941766920113349e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1231714619000511e+04, - "cpu_time": 1.9012902410760184e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2936327955600929e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1231232441453498e+04, - "cpu_time": 1.9006097923086782e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2939457381044340e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0083892606007305e+00, - "cpu_time": 2.6727717777505433e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3042254283673510e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7881412845044788e-04, - "cpu_time": 1.4057673678679965e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7881698529726938e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 61895, - "real_time": 1.1305508641197166e+04, - "cpu_time": 1.9570007044187776e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4492050309259737e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 61895, - "real_time": 1.1303384274021912e+04, - "cpu_time": 1.9514424638500688e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4494773956906562e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 61895, - "real_time": 1.1302871760642931e+04, - "cpu_time": 1.9519895128847336e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4495431202758374e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 61895, - "real_time": 1.1302028994345606e+04, - "cpu_time": 1.9519287325308964e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4496512093710694e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 61895, - "real_time": 1.1302028195233395e+04, - "cpu_time": 1.9707012844333243e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4496513118689542e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1303164373088201e+04, - "cpu_time": 1.9566125396235602e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4495056136264982e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1302871760642929e+04, - "cpu_time": 1.9519895128847336e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4495431202758374e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4326161825156427e+00, - "cpu_time": 8.1957841423473781e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8369748174648450e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2674470044216738e-04, - "cpu_time": 4.1887619425786749e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2673112819956199e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 61479, - "real_time": 1.1384522583293538e+04, - "cpu_time": 2.0428289513492407e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8782937325879703e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 61479, - "real_time": 1.1381058245145674e+04, - "cpu_time": 2.0443003757380502e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8791698710422139e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 61479, - "real_time": 1.1385724554857497e+04, - "cpu_time": 2.0432826721319554e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8779898760171723e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 61479, - "real_time": 1.1387604331271948e+04, - "cpu_time": 2.0491666731729521e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8775148000193954e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 61479, - "real_time": 1.1385422140967950e+04, - "cpu_time": 2.0439445631841787e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8780663197450995e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1384866371107320e+04, - "cpu_time": 2.0447046471152753e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8782069198823705e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1385422140967950e+04, - "cpu_time": 2.0439445631841783e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8780663197450995e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4063353226956146e+00, - "cpu_time": 2.5588614130795861e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0842372603309934e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1136263213439619e-04, - "cpu_time": 1.2514577186928668e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1138984894733176e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 54941, - "real_time": 1.2734861861678375e+04, - "cpu_time": 2.3746147813108568e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1461885265681839e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 54941, - "real_time": 1.2733176416079701e+04, - "cpu_time": 2.3772692033272044e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1468697093711720e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 54941, - "real_time": 1.2730788198142647e+04, - "cpu_time": 2.3735495531570126e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1478352306231403e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 54941, - "real_time": 1.2739053059107977e+04, - "cpu_time": 2.3770180065888835e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1444954107592840e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 54941, - "real_time": 1.2730228781196462e+04, - "cpu_time": 2.3756224750186579e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1480614470025692e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2733621663241032e+04, - "cpu_time": 2.3756148038805233e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1466900648648701e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2733176416079703e+04, - "cpu_time": 2.3756224750186579e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1468697093711720e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5628840626136649e+00, - "cpu_time": 1.5788745918626589e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4398275114471177e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7980131315656035e-04, - "cpu_time": 6.6461725582935254e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7975795964020644e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 48213, - "real_time": 1.4512786517639643e+04, - "cpu_time": 2.8967259680998875e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.0314840530926189e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 48213, - "real_time": 1.4514631850999684e+04, - "cpu_time": 2.8992502914151784e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.0303358256360130e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 48213, - "real_time": 1.4511096915076845e+04, - "cpu_time": 2.8954432020409298e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.0325356358014431e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 48213, - "real_time": 1.4517575662036143e+04, - "cpu_time": 2.9128858046584817e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.0285046932978535e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 48213, - "real_time": 1.4507999512431727e+04, - "cpu_time": 2.8921338601621839e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.0344640477611008e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4512818091636809e+04, - "cpu_time": 2.8992878252753329e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.0314648511178055e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4512786517639641e+04, - "cpu_time": 2.8967259680998879e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.0314840530926189e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6092364266970178e+00, - "cpu_time": 8.0223112151442251e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2460722359176250e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4869301082033722e-04, - "cpu_time": 2.7669937234956594e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4869412359387449e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 35885, - "real_time": 1.9503652301163569e+04, - "cpu_time": 4.1704425943987648e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3440764629728390e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 35885, - "real_time": 1.9505673235444865e+04, - "cpu_time": 4.1760593172634530e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3439372065540567e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 35885, - "real_time": 1.9493655795986044e+04, - "cpu_time": 4.1692334986763090e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3447657163105255e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 35885, - "real_time": 1.9506892032757292e+04, - "cpu_time": 4.1773433440155786e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3438532368959139e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 35885, - "real_time": 1.9500908330481030e+04, - "cpu_time": 4.1766456151595186e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3442655878252298e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9502156339166562e+04, - "cpu_time": 4.1739448739027248e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3441796421117130e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9503652301163565e+04, - "cpu_time": 4.1760593172634530e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3440764629728390e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2642666967243867e+00, - "cpu_time": 3.8005753328245717e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6291560008795434e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6993254515922719e-04, - "cpu_time": 9.1054756295115005e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6999040062666927e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 18978, - "real_time": 3.6876979656136566e+04, - "cpu_time": 7.2179605121720087e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4217216401364233e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 18978, - "real_time": 3.6883437564241212e+04, - "cpu_time": 7.2175693803351125e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4214727113947247e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 18978, - "real_time": 3.6880359512123607e+04, - "cpu_time": 7.2193555854146922e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4215913481744989e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 18978, - "real_time": 3.6885402110369170e+04, - "cpu_time": 7.2136797502371497e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4213970026169592e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 18978, - "real_time": 3.6879230740539984e+04, - "cpu_time": 7.2104404521024073e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4216348591665972e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6881081916682109e+04, - "cpu_time": 7.2158011360522738e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4215635122978407e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6880359512123599e+04, - "cpu_time": 7.2175693803351111e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4215913481744989e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3537446171223699e+00, - "cpu_time": 3.6626804911756800e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2926707103667199e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.0934008516854248e-05, - "cpu_time": 5.0759166198134891e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0933025445850374e-05, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10907, - "real_time": 6.4194383454151131e+04, - "cpu_time": 1.2608297001925371e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6334388517788525e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10907, - "real_time": 6.4210323724423994e+04, - "cpu_time": 1.2608994920693096e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6330333491234962e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10907, - "real_time": 6.4209470387413596e+04, - "cpu_time": 1.2615314660309961e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6330550519624640e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10907, - "real_time": 6.4195000328876427e+04, - "cpu_time": 1.2601131447694119e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6334231554296381e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10907, - "real_time": 6.4199446652765684e+04, - "cpu_time": 1.2605655386448969e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6333100278440294e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4201724909526165e+04, - "cpu_time": 1.2607878683414301e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6332520872276960e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4199446652765677e+04, - "cpu_time": 1.2608297001925370e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6333100278440294e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7175035991993823e+00, - "cpu_time": 5.1764603680505537e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9632351918606185e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2020710674167989e-04, - "cpu_time": 4.1057345950355631e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2020405222276741e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6550, - "real_time": 1.0677043334554297e+05, - "cpu_time": 2.1394853374045939e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9641692313947544e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6550, - "real_time": 1.0669023875935351e+05, - "cpu_time": 2.1394195358778560e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9656456151815884e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6550, - "real_time": 1.0680951709274331e+05, - "cpu_time": 2.1392232732824475e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9634505024295082e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6550, - "real_time": 1.0661431870828490e+05, - "cpu_time": 2.1379896946564951e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9670453513267467e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6550, - "real_time": 1.0666321700248682e+05, - "cpu_time": 2.1381175511450254e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9661435862665810e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0670954498168229e+05, - "cpu_time": 2.1388470784732833e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9652908573198360e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0669023875935352e+05, - "cpu_time": 2.1392232732824475e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9656456151815884e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9512374606212887e+01, - "cpu_time": 7.3210682521826982e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4642574783855468e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.4512898185314096e-04, - "cpu_time": 3.4229040149090517e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4505891732607301e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3462, - "real_time": 2.0245742750965981e+05, - "cpu_time": 4.1901751704217051e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0716967767457569e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3462, - "real_time": 2.0235737586694708e+05, - "cpu_time": 4.1901999075678579e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0727210866570122e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3462, - "real_time": 2.0260366686405413e+05, - "cpu_time": 4.1930678249566950e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0702014257295517e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3462, - "real_time": 2.0247019112396904e+05, - "cpu_time": 4.1907609560947475e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0715661780710716e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3462, - "real_time": 2.0254256973164275e+05, - "cpu_time": 4.1940771981513733e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0708259036888943e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0248624621925462e+05, - "cpu_time": 4.1916562114384759e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0714022741784576e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time_median", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0247019112396910e+05, - "cpu_time": 4.1907609560947475e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0715661780710716e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3080338548431882e+01, - "cpu_time": 1.8006675831297827e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5224767467292883e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5968721474367875e-04, - "cpu_time": 4.2958379511563917e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5971161012198919e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1763, - "real_time": 3.9708195553003781e+05, - "cpu_time": 7.9190511571185687e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1125633847558285e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1763, - "real_time": 3.9716761828858725e+05, - "cpu_time": 7.9207211684627854e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1121077383264229e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1763, - "real_time": 3.9707922189952352e+05, - "cpu_time": 7.9149212308565329e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1125779283718464e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1763, - "real_time": 3.9709228841335396e+05, - "cpu_time": 7.9195550482133124e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1125084129732239e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1763, - "real_time": 3.9691849420469423e+05, - "cpu_time": 7.9166218207600352e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1134333931222473e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9706791566723934e+05, - "cpu_time": 7.9181740850822465e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1126381715099136e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time_median", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9708195553003781e+05, - "cpu_time": 7.9190511571185687e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1125633847558285e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1085626514805668e+01, - "cpu_time": 2.3534301238605821e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8471547123152567e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2939558428372112e-04, - "cpu_time": 2.9721879041462581e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2943610399934076e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 891, - "real_time": 7.8525694307173975e+05, - "cpu_time": 1.6449127441077416e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1365256490915562e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 891, - "real_time": 7.8536505651776295e+05, - "cpu_time": 1.6451486419753064e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1362315347194904e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 891, - "real_time": 7.8524887174008333e+05, - "cpu_time": 1.6447647789001123e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1365476097816341e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 891, - "real_time": 7.8527978784744395e+05, - "cpu_time": 1.6447648810325523e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1364634948759567e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 891, - "real_time": 7.8490627438298240e+05, - "cpu_time": 1.6445165241301809e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1374801740741119e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8521138671200257e+05, - "cpu_time": 1.6448215140291788e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1366496925085499e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time_median", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8525694307173975e+05, - "cpu_time": 1.6447648810325521e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1365256490915562e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7668274297731315e+02, - "cpu_time": 2.3172215592021863e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8089312280214615e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2501296589336948e-04, - "cpu_time": 1.4087981823182057e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2506877214745948e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 74, - "real_time": 9.3687856066468600e+06, - "cpu_time": 1.8182425000000075e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5815134862510014e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 74, - "real_time": 9.3419033077520300e+06, - "cpu_time": 1.8164928364864897e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5918196640031705e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 74, - "real_time": 9.3595983485716414e+06, - "cpu_time": 1.8176359256756701e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5850290525683408e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 74, - "real_time": 9.3478838837630041e+06, - "cpu_time": 1.8174097067567669e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5895216946675010e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 74, - "real_time": 9.3690234337102715e+06, - "cpu_time": 1.8186915891891852e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5814225716705189e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3574389160887636e+06, - "cpu_time": 1.8176945116216239e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5858612938321061e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time_median", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3595983485716414e+06, - "cpu_time": 1.8176359256756701e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5850290525683408e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2250156661297036e+04, - "cpu_time": 8.4009288058809070e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6957166682499060e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3091356268684440e-03, - "cpu_time": 4.6217495581180837e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3095087298348146e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 38, - "real_time": 1.8446339931535095e+07, - "cpu_time": 3.5774108578947723e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6380585118283267e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 38, - "real_time": 1.8424069852029022e+07, - "cpu_time": 3.5744602315789185e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6424560121068678e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 38, - "real_time": 1.8462937815408956e+07, - "cpu_time": 3.5762714657895036e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6347879557928047e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 38, - "real_time": 1.8405812743463013e+07, - "cpu_time": 3.5712793473684795e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6460690400011973e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 38, - "real_time": 1.8441905757706415e+07, - "cpu_time": 3.5764327131578974e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6389332470130897e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8436213220028497e+07, - "cpu_time": 3.5751709231579140e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6400609533484573e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time_median", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8441905757706415e+07, - "cpu_time": 3.5762714657895043e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6389332470130897e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1913521117784545e+04, - "cpu_time": 2.4222954171585494e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3277999181847582e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1886129139566694e-03, - "cpu_time": 6.7753275835521706e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1889361122383558e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19, - "real_time": 3.6818379046101317e+07, - "cpu_time": 7.0261417052630812e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6454002451314392e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19, - "real_time": 3.6453281970400557e+07, - "cpu_time": 6.9833299315788329e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6819106742976532e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19, - "real_time": 3.6741174365344800e+07, - "cpu_time": 7.0126294473684117e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6530603694202418e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19, - "real_time": 3.6776467177428700e+07, - "cpu_time": 7.0241834263157442e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6495546826851058e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19, - "real_time": 3.6654158446349598e+07, - "cpu_time": 7.0112942684210420e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6617326297766032e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6688692201124996e+07, - "cpu_time": 7.0115157557894230e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6583317202622089e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time_median", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6741174365344800e+07, - "cpu_time": 7.0126294473684117e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6530603694202418e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4481717675442545e+05, - "cpu_time": 1.7103496182132716e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4487752036663245e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.9471883042477294e-03, - "cpu_time": 2.4393436138270565e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9602073142850054e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 7.2386173158884048e+07, - "cpu_time": 1.3597544050000182e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7083802649823403e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 7.2506430000066757e+07, - "cpu_time": 1.3608556180000165e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7022296643173971e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 7.2236829996109009e+07, - "cpu_time": 1.3592034179999930e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7160470083537593e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 7.2265229374170303e+07, - "cpu_time": 1.3594704110000178e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7145866459526749e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 7.2461872547864914e+07, - "cpu_time": 1.3611050020000166e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7045061983829374e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2371307015419006e+07, - "cpu_time": 1.3600777708000124e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7091499563978219e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time_median", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2386173158884048e+07, - "cpu_time": 1.3597544050000182e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7083802649823403e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1834047655179084e+05, - "cpu_time": 8.5120420418998212e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0657702492593639e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6351850122946917e-03, - "cpu_time": 6.2584965541293610e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6353531996722499e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4173555374145508e+08, - "cpu_time": 2.5795418499999982e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7878351467079711e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4091583788394928e+08, - "cpu_time": 2.5705348159999627e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.8098692103164306e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4129660725593567e+08, - "cpu_time": 2.5759499079999843e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7996022864692445e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4074937403202057e+08, - "cpu_time": 2.5693423760000086e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.8143751309178934e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4103874862194061e+08, - "cpu_time": 2.5718533279999748e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.8065490317068934e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4114722430706027e+08, - "cpu_time": 2.5734444555999860e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.8036461612236872e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time_median", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4103874862194061e+08, - "cpu_time": 2.5718533279999748e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.8065490317068934e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8472011943378701e+05, - "cpu_time": 4.2213817902065732e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0351387476778174e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7256654980110941e-03, - "cpu_time": 1.6403625036555834e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7214380723174273e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8250254690647125e+08, - "cpu_time": 4.4999255850000000e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8008217474778595e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8317712247371674e+08, - "cpu_time": 4.5039139699998999e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7917675503594398e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8178414702415466e+08, - "cpu_time": 4.4931131999999255e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8105118238179607e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8038373589515686e+08, - "cpu_time": 4.4791443999999106e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8295438948053012e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8191879391670227e+08, - "cpu_time": 4.4972750949999350e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8086918898966889e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8195326924324036e+08, - "cpu_time": 4.4946744499999344e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8082673812714500e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time_median", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8191879391670227e+08, - "cpu_time": 4.4972750949999350e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8086918898966889e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0359474510012144e+06, - "cpu_time": 9.5305621240340301e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4014186034124136e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.6741813768703109e-03, - "cpu_time": 2.1204121077187626e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6799375230436890e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 95703, - "real_time": 7.3070969064981473e+03, - "cpu_time": 1.4485881383028629e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5034433411214389e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 95703, - "real_time": 7.2920020579620013e+03, - "cpu_time": 1.4480511906628020e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5106956630720966e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 95703, - "real_time": 7.3078594307885824e+03, - "cpu_time": 1.4524155919877321e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5030777811824352e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 95703, - "real_time": 7.2923165002528740e+03, - "cpu_time": 1.4497821781971244e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5105442830288939e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 95703, - "real_time": 7.3074551601560606e+03, - "cpu_time": 1.4518093863306454e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5032715820938781e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3013460111315344e+03, - "cpu_time": 1.4501292970962337e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5062065300997488e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time_median", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3070969064981491e+03, - "cpu_time": 1.4497821781971248e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5034433411214389e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3913744762428060e+00, - "cpu_time": 1.9276950270696339e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0313340913709944e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1492914407082516e-03, - "cpu_time": 1.3293263096812726e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1497708582661006e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 94027, - "real_time": 7.4687748491719658e+03, - "cpu_time": 1.4661183755729557e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.8552073176601842e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 94027, - "real_time": 7.4579243466666403e+03, - "cpu_time": 1.4664585225520095e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.8651809297159359e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 94027, - "real_time": 7.4886485245587619e+03, - "cpu_time": 1.4711133972157029e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.8370146939185873e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 94027, - "real_time": 7.4489387259573432e+03, - "cpu_time": 1.4645652057387641e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.8734623660660788e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 94027, - "real_time": 7.4701721772464925e+03, - "cpu_time": 1.4671595626787916e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.8539250214273289e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4668917247202407e+03, - "cpu_time": 1.4670830127516450e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.8569580657576233e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time_median", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4687748491719658e+03, - "cpu_time": 1.4664585225520097e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.8552073176601842e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4919700896671008e+01, - "cpu_time": 2.4448785179046162e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3693155018566758e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9981140006727497e-03, - "cpu_time": 1.6664895555698845e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9969722561011178e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 92284, - "real_time": 7.5751365104701845e+03, - "cpu_time": 1.4735591391790691e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3517908206467962e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 92284, - "real_time": 7.5754367733694098e+03, - "cpu_time": 1.4756365274587157e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3517372405506122e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 92284, - "real_time": 7.5759638018961550e+03, - "cpu_time": 1.4737282074899227e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3516432057710040e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 92284, - "real_time": 7.5788038073146090e+03, - "cpu_time": 1.4745653504399201e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3511367044647551e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 92284, - "real_time": 7.5780924283983850e+03, - "cpu_time": 1.4741316121971466e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3512635398357373e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5766866642897494e+03, - "cpu_time": 1.4743241673529552e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3515143022537810e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time_median", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5759638018961541e+03, - "cpu_time": 1.4741316121971468e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3516432057710040e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6542522133683408e+00, - "cpu_time": 8.3035716415512759e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9506012268688562e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1833451568812012e-04, - "cpu_time": 5.6321206864971580e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1831816518319067e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 89399, - "real_time": 7.8338695177767031e+03, - "cpu_time": 1.5034665947046626e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6142891394254857e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 89399, - "real_time": 7.8166353913449348e+03, - "cpu_time": 1.5025878331972466e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6200531270368236e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 89399, - "real_time": 7.8252315796435823e+03, - "cpu_time": 1.5005076331950224e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6171749412856111e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 89399, - "real_time": 7.7995922832116903e+03, - "cpu_time": 1.5091966890009959e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6257782787034112e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 89399, - "real_time": 7.8061758806923417e+03, - "cpu_time": 1.5081939909842451e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6235637414543623e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8163009305338510e+03, - "cpu_time": 1.5047905482164346e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6201718455811393e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time_median", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8166353913449329e+03, - "cpu_time": 1.5034665947046626e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6200531270368236e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3876411143236163e+01, - "cpu_time": 3.7398417989189781e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6513119418073865e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7753169007386732e-03, - "cpu_time": 2.4852905963236257e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7751934666620126e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 81827, - "real_time": 8.5525929885953356e+03, - "cpu_time": 1.5839829078421684e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7891908400901473e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 81827, - "real_time": 8.5491844269063404e+03, - "cpu_time": 1.5853951886296525e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7911002915189224e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 81827, - "real_time": 8.5546357588329174e+03, - "cpu_time": 1.5849764368729315e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7880472243026334e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 81827, - "real_time": 8.5522403773316237e+03, - "cpu_time": 1.5860266782357694e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7893882997685206e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 81827, - "real_time": 8.5560477345024246e+03, - "cpu_time": 1.5867600498613061e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7872570690352768e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5529402572337276e+03, - "cpu_time": 1.5854282522883655e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7889967449431002e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time_median", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5525929885953356e+03, - "cpu_time": 1.5853951886296523e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7891908400901473e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6099726784582007e+00, - "cpu_time": 1.0519088993791625e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4615024816947797e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0515502271289600e-04, - "cpu_time": 6.6348565307882258e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0517925977670388e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 65101, - "real_time": 1.0752662663904348e+04, - "cpu_time": 1.8286137570851486e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6185780732243681e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 65101, - "real_time": 1.0751485786896974e+04, - "cpu_time": 1.8301837268245054e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6194120165082073e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 65101, - "real_time": 1.0753878495564084e+04, - "cpu_time": 1.8305476444294116e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6177167180930638e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 65101, - "real_time": 1.0753180563347960e+04, - "cpu_time": 1.8301387889587040e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6182111438938332e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 65101, - "real_time": 1.0754335848207045e+04, - "cpu_time": 1.8288311961413830e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6173927573275149e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0753108671584083e+04, - "cpu_time": 1.8296630226878304e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6182621418093979e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time_median", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0753180563347960e+04, - "cpu_time": 1.8301387889587037e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6182111438938332e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1109047379386485e+00, - "cpu_time": 8.7648954323831418e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8707396348754919e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0331010053625700e-04, - "cpu_time": 4.7904424605506015e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0331410876084829e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 65150, - "real_time": 1.0744486905380823e+04, - "cpu_time": 1.8639259232540357e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5248750493422742e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 65150, - "real_time": 1.0741371051804927e+04, - "cpu_time": 1.8624776822716700e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5253173846226003e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 65150, - "real_time": 1.0742324511634144e+04, - "cpu_time": 1.8644973092862674e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5251820015543017e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 65150, - "real_time": 1.0740897636024794e+04, - "cpu_time": 1.8616132663085147e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5253846145082262e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 65150, - "real_time": 1.0743188642457273e+04, - "cpu_time": 1.8628071573292302e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5250593231929429e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0742453749460392e+04, - "cpu_time": 1.8630642676899439e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5251636746440692e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time_median", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0742324511634142e+04, - "cpu_time": 1.8628071573292305e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5251820015543017e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4391157348848340e+00, - "cpu_time": 1.1523510448909857e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0431033179944669e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3396527166403883e-04, - "cpu_time": 6.1852458064681380e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3395961049696980e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 63856, - "real_time": 1.0957148571530412e+04, - "cpu_time": 1.9522181690052545e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9905590661734738e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 63856, - "real_time": 1.0960571229945122e+04, - "cpu_time": 1.9514721075544894e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9896252040655789e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 63856, - "real_time": 1.0955701674930830e+04, - "cpu_time": 1.9520881498997525e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9909540230527396e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 63856, - "real_time": 1.0961908421224569e+04, - "cpu_time": 1.9506200529315909e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9892605138494167e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 63856, - "real_time": 1.0958347221297619e+04, - "cpu_time": 1.9522223753445433e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9902319517960863e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0958735423785713e+04, - "cpu_time": 1.9517241709471262e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9901261517874589e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time_median", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0958347221297621e+04, - "cpu_time": 1.9520881498997529e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9902319517960863e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5154785941051143e+00, - "cpu_time": 6.9053148503867039e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8634120680606086e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2954095493950144e-04, - "cpu_time": 3.5380587857533760e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2953586971431787e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 58475, - "real_time": 1.1993325763576277e+04, - "cpu_time": 2.2120903565626362e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.4643725428548603e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 58475, - "real_time": 1.1965530473486097e+04, - "cpu_time": 2.1966092997006814e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.4770659892779856e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 58475, - "real_time": 1.1983331821617317e+04, - "cpu_time": 2.1981481761436487e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.4689297580641479e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 58475, - "real_time": 1.1976305694413153e+04, - "cpu_time": 2.2010377186832142e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.4721382095792704e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 58475, - "real_time": 1.1982642226947566e+04, - "cpu_time": 2.2034386968790099e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.4692444920551147e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1980227196008082e+04, - "cpu_time": 2.2022648495938385e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.4703501983662758e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time_median", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1982642226947564e+04, - "cpu_time": 2.2010377186832142e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.4692444920551147e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0227602046817895e+01, - "cpu_time": 6.0900862022350530e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6709590610237634e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.5370685208923443e-04, - "cpu_time": 2.7653741117278615e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5386837983768369e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 46478, - "real_time": 1.5058230192371906e+04, - "cpu_time": 2.8229377791643117e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7043429623221951e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 46478, - "real_time": 1.5057441671952050e+04, - "cpu_time": 2.8221912517750112e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7047987869115734e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 46478, - "real_time": 1.5059045740642539e+04, - "cpu_time": 2.8212202633503926e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7038715638038445e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 46478, - "real_time": 1.5060502110039095e+04, - "cpu_time": 2.8232264146477992e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7030298885340271e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 46478, - "real_time": 1.5059241940613156e+04, - "cpu_time": 2.8216089827445197e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7037581650450096e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5058892331123750e+04, - "cpu_time": 2.8222369383364065e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7039602733233318e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time_median", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5059045740642541e+04, - "cpu_time": 2.8221912517750112e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7038715638038445e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1489113639386130e+00, - "cpu_time": 8.5151112057004159e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6405736619662610e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.6294546682164718e-05, - "cpu_time": 3.0171496553084323e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.6293703710009789e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 32870, - "real_time": 2.1304701552579616e+04, - "cpu_time": 4.2469288226346296e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2304514069489939e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 32870, - "real_time": 2.1299141456136647e+04, - "cpu_time": 4.2476140158199087e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2307726137218166e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 32870, - "real_time": 2.1301231781317430e+04, - "cpu_time": 4.2445009339823097e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2306518359652674e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 32870, - "real_time": 2.1297721714321109e+04, - "cpu_time": 4.2496935138424000e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2308546590865067e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 32870, - "real_time": 2.1303816005949680e+04, - "cpu_time": 4.2467749558868156e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2305025537527597e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1301322502060899e+04, - "cpu_time": 4.2471024484332134e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2306466138950689e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time_median", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1301231781317430e+04, - "cpu_time": 4.2469288226346303e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2306518359652674e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9734831233795695e+00, - "cpu_time": 1.8628335838519767e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7178846214108793e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3959147950048104e-04, - "cpu_time": 4.3861282049817034e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3959203251481540e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19178, - "real_time": 3.6495715189570343e+04, - "cpu_time": 6.9487739545312375e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4365741218569946e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19178, - "real_time": 3.6501886834145982e+04, - "cpu_time": 6.9550342110752128e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4363312296216717e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19178, - "real_time": 3.6495281776125419e+04, - "cpu_time": 6.9609603764730055e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4365911824332867e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19178, - "real_time": 3.6500052284785728e+04, - "cpu_time": 6.9537038898737839e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4364034218617773e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19178, - "real_time": 3.6496891446874113e+04, - "cpu_time": 6.9578344352904955e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4365278225494030e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6497965506300323e+04, - "cpu_time": 6.9552613734487473e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4364855556646269e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time_median", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6496891446874113e+04, - "cpu_time": 6.9550342110752128e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4365278225494030e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8788623062211220e+00, - "cpu_time": 4.5733807168529921e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1330264903522776e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.8877336483979349e-05, - "cpu_time": 6.5754261001773012e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8874896157800478e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10952, - "real_time": 6.3893991467844229e+04, - "cpu_time": 1.2383313659605748e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6411183210047445e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10952, - "real_time": 6.3886857875050082e+04, - "cpu_time": 1.2376943060628224e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6413015679231007e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10952, - "real_time": 6.3902401930079497e+04, - "cpu_time": 1.2380962089116144e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6409023265625088e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10952, - "real_time": 6.3901249809562498e+04, - "cpu_time": 1.2379117969320682e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6409319115431229e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10952, - "real_time": 6.3917975835004043e+04, - "cpu_time": 1.2376543745434539e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6405025132628775e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3900495383508074e+04, - "cpu_time": 1.2379376104821070e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6409513280592707e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time_median", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3901249809562498e+04, - "cpu_time": 1.2379117969320682e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6409319115431229e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1597982718299061e+01, - "cpu_time": 2.8296767182931678e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9781180247935103e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8150066988827061e-04, - "cpu_time": 2.2857991342481047e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8148728569028841e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6486, - "real_time": 1.0828274912364381e+05, - "cpu_time": 2.1937398304039577e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9367369382221214e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6486, - "real_time": 1.0840640885262117e+05, - "cpu_time": 2.1947202836879331e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9345276927779095e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6486, - "real_time": 1.0827709507188562e+05, - "cpu_time": 2.1921728754239538e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9368380714385548e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6486, - "real_time": 1.0821213925531690e+05, - "cpu_time": 2.1916913999383696e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9380006849804131e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6486, - "real_time": 1.0827171454497991e+05, - "cpu_time": 2.1923060730804666e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9369343219634418e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0829002136968949e+05, - "cpu_time": 2.1929260925069364e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9366075418764877e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time_median", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0827709507188562e+05, - "cpu_time": 2.1923060730804666e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9368380714385548e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1004902083222476e+01, - "cpu_time": 1.2607058694469814e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2691820700908124e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.5569201284779535e-04, - "cpu_time": 5.7489665235628258e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5536358949683259e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3413, - "real_time": 2.0526278121610425e+05, - "cpu_time": 4.1741573483739037e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0433826216084267e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3413, - "real_time": 2.0527880817025228e+05, - "cpu_time": 4.1745720714912866e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0432230863895927e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3413, - "real_time": 2.0523412843106448e+05, - "cpu_time": 4.1734313155581790e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0436678987378128e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3413, - "real_time": 2.0535428591880680e+05, - "cpu_time": 4.1734774304131191e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0424721019255222e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3413, - "real_time": 2.0511687597545853e+05, - "cpu_time": 4.1714242103721382e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0448361355219906e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0524937594233727e+05, - "cpu_time": 4.1734124752417259e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0435163688366692e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time_median", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0526278121610422e+05, - "cpu_time": 4.1734774304131197e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0433826216084267e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6372432481308039e+01, - "cpu_time": 1.2100899471944820e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6010779984464739e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2081702847941173e-04, - "cpu_time": 2.8995215650818050e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2089596783327388e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1741, - "real_time": 4.0226981530205644e+05, - "cpu_time": 7.9087840436532616e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0853187788154472e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1741, - "real_time": 4.0202995102653588e+05, - "cpu_time": 7.9076870993681694e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0865629485018921e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1741, - "real_time": 4.0246546800055215e+05, - "cpu_time": 7.9111763584146101e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0843050316029827e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1741, - "real_time": 4.0215888465642353e+05, - "cpu_time": 7.9092285927629389e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0858939886822697e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1741, - "real_time": 4.0249294091319898e+05, - "cpu_time": 7.9115283055715193e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0841627634431171e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0228341197975341e+05, - "cpu_time": 7.9096808799540997e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0852487022091415e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time_median", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0226981530205649e+05, - "cpu_time": 7.9092285927629389e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0853187788154472e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9810423223847258e+02, - "cpu_time": 1.6304506515831389e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0269281745758073e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.9244941834301382e-04, - "cpu_time": 2.0613355662872209e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9247275564198430e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 878, - "real_time": 7.9726311112998019e+05, - "cpu_time": 1.6469884384965878e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1043512192883537e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 878, - "real_time": 7.9730738395642582e+05, - "cpu_time": 1.6472973416856921e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1042343690268524e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 878, - "real_time": 7.9727985047319473e+05, - "cpu_time": 1.6474641355353326e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1043070372395000e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 878, - "real_time": 7.9738171745976328e+05, - "cpu_time": 1.6475788143507938e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1040382081304237e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 878, - "real_time": 7.9673515471782535e+05, - "cpu_time": 1.6462299772209206e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1057456672590126e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9719344354743813e+05, - "cpu_time": 1.6471117414578656e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1045353001888283e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time_median", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9727985047319462e+05, - "cpu_time": 1.6472973416856923e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1043070372395000e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6018160133558615e+02, - "cpu_time": 5.4071663294785424e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8713868347634161e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2637197839686412e-04, - "cpu_time": 3.2828169415468050e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2650375758234534e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 73, - "real_time": 9.4624256638631430e+06, - "cpu_time": 1.8319184465753257e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5460708693484225e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 73, - "real_time": 9.4536957139634099e+06, - "cpu_time": 1.8302043232876733e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5493454639585056e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 73, - "real_time": 9.4661209221980348e+06, - "cpu_time": 1.8324825863014169e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5446866013844094e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 73, - "real_time": 9.4769922378536779e+06, - "cpu_time": 1.8328240123287443e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5406203949365387e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 73, - "real_time": 9.4545590882636104e+06, - "cpu_time": 1.8310109438356113e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5490213437507310e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.4627587252283767e+06, - "cpu_time": 1.8316880624657545e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5459489346757221e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time_median", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.4624256638631430e+06, - "cpu_time": 1.8319184465753257e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5460708693484225e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5312695830039338e+03, - "cpu_time": 1.0764175117132796e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5699368981313943e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0072400512117997e-03, - "cpu_time": 5.8766420646113942e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0067648925287938e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 37, - "real_time": 1.8649105234323323e+07, - "cpu_time": 3.6027656864864700e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5985031537324066e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 37, - "real_time": 1.8708283484384820e+07, - "cpu_time": 3.6101290054054476e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5871203285974112e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 37, - "real_time": 1.8669922257194649e+07, - "cpu_time": 3.6030885837839052e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5944908112372513e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 37, - "real_time": 1.8694757005652867e+07, - "cpu_time": 3.6069114810809545e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5897157678865695e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 37, - "real_time": 1.8672486314096965e+07, - "cpu_time": 3.6051602189188913e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5939972251759286e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8678910859130524e+07, - "cpu_time": 3.6056109951351345e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5927654573259144e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time_median", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8672486314096965e+07, - "cpu_time": 3.6051602189188913e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5939972251759286e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3045045494842390e+04, - "cpu_time": 3.0317165110606835e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4323622997043012e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2337467461909124e-03, - "cpu_time": 8.4083294486044739e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2336909693524210e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19, - "real_time": 3.6943822314864710e+07, - "cpu_time": 7.0453714842104003e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6330222372793345e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19, - "real_time": 3.6944841475863203e+07, - "cpu_time": 7.0438998789472267e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6329220166687436e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19, - "real_time": 3.6954490958075777e+07, - "cpu_time": 7.0476276473683402e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6319733953923941e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19, - "real_time": 3.6837227250400342e+07, - "cpu_time": 7.0398208894738153e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6435350328529773e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19, - "real_time": 3.7088950213633083e+07, - "cpu_time": 7.0637820473683938e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6188063352266169e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6953866442567423e+07, - "cpu_time": 7.0481003894736350e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6320518034840136e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time_median", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6944841475863203e+07, - "cpu_time": 7.0453714842103988e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6329220166687436e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9491690814443733e+04, - "cpu_time": 9.2165504968694033e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7893706635776833e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4217138673034121e-03, - "cpu_time": 1.3076644751874359e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4199463937013667e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 7.2995025664567947e+07, - "cpu_time": 1.3679419530000132e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6774486145608625e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 7.2632127255201340e+07, - "cpu_time": 1.3647891719999734e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6958225807819333e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 7.2951726615428925e+07, - "cpu_time": 1.3675623560000077e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6796312911835489e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 7.2671247273683548e+07, - "cpu_time": 1.3644674590000251e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6938330642524776e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 7.2966641187667847e+07, - "cpu_time": 1.3685615229999825e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6788791649267874e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2843353599309921e+07, - "cpu_time": 1.3666644926000005e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6851229431411219e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time_median", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2951726615428925e+07, - "cpu_time": 1.3675623560000077e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6796312911835489e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7620024915247061e+05, - "cpu_time": 1.8960862381363672e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9216980194041543e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4188926023600843e-03, - "cpu_time": 1.3873823812669431e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4210041719258044e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4277456402778625e+08, - "cpu_time": 2.5927490179999495e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7602700148712497e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4287561774253845e+08, - "cpu_time": 2.5913620219999987e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7576104340450883e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4244477152824402e+08, - "cpu_time": 2.5887463320000282e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7689759072241483e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4251200258731842e+08, - "cpu_time": 2.5858315400000721e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7671978658152266e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4244345724582672e+08, - "cpu_time": 2.5890743520000115e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7690106824174905e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4261008262634277e+08, - "cpu_time": 2.5895526528000122e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7646129808746409e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time_median", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4251200258731842e+08, - "cpu_time": 2.5890743520000115e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7671978658152266e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0141654597546675e+05, - "cpu_time": 2.6559448761464306e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3139804089063033e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4123583849481713e-03, - "cpu_time": 1.0256384913721025e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4115608791402761e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8518141806125641e+08, - "cpu_time": 4.5284428100001150e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7651184684458032e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8328181803226471e+08, - "cpu_time": 4.5093928150001264e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7903661853712931e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8465500473976135e+08, - "cpu_time": 4.5178910199999225e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7720813128918681e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8395973145961761e+08, - "cpu_time": 4.5145667199997777e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7813172257936811e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8482156991958618e+08, - "cpu_time": 4.5202631499998349e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7698753795337553e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8437990844249725e+08, - "cpu_time": 4.5181113029999554e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7757517144072809e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time_median", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8465500473976135e+08, - "cpu_time": 4.5178910199999219e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7720813128918681e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5754731668162113e+05, - "cpu_time": 7.0709813432574994e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0070088840569383e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6638566726833314e-03, - "cpu_time": 1.5650303565037185e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6670421156519794e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 92192, - "real_time": 7.6470061936225911e+03, - "cpu_time": 1.4735546001822215e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3477153479161229e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 92192, - "real_time": 7.7360688849840117e+03, - "cpu_time": 1.4881879089291939e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3091742564095471e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 92192, - "real_time": 7.6780385725038341e+03, - "cpu_time": 1.4748878438475920e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3341848648269758e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 92192, - "real_time": 7.7269677177010526e+03, - "cpu_time": 1.4860594606906936e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3130719494731601e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 92192, - "real_time": 7.7054351745156409e+03, - "cpu_time": 1.4792860736289258e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3223302020199269e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6987033086654264e+03, - "cpu_time": 1.4803951774557256e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3252953241291463e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time_median", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7054351745156409e+03, - "cpu_time": 1.4792860736289256e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3223302020199269e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6537666024219867e+01, - "cpu_time": 6.5415040431723867e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5809594096277820e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.7459506567936174e-03, - "cpu_time": 4.4187553045227515e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7543428643945056e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 84260, - "real_time": 8.2756338836470331e+03, - "cpu_time": 1.5285839378115514e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.1868372525726579e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 84260, - "real_time": 8.2428742746565695e+03, - "cpu_time": 1.5296138642297588e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.2114255651598170e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 84260, - "real_time": 8.1516458716668440e+03, - "cpu_time": 1.5165444457630698e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.2809401691453330e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 84260, - "real_time": 8.3148246452872809e+03, - "cpu_time": 1.5386533218609246e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.1576764615257874e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 84260, - "real_time": 8.2209893435262256e+03, - "cpu_time": 1.5239406444339395e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.2279608767913572e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2411936037567903e+03, - "cpu_time": 1.5274672428198490e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.2129680650389910e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time_median", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2428742746565695e+03, - "cpu_time": 1.5285839378115514e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.2114255651598170e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.1313734726415518e+01, - "cpu_time": 8.1044393268626521e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6333981660264748e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.4399095172895027e-03, - "cpu_time": 5.3058023764235296e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4576243069702577e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 78618, - "real_time": 8.8908237153156697e+03, - "cpu_time": 1.5939233877737692e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1517493010642183e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 78618, - "real_time": 8.9785573182704265e+03, - "cpu_time": 1.6038865399781374e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1404950302163434e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 78618, - "real_time": 8.9036675759868540e+03, - "cpu_time": 1.5946283408379866e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1500878612783374e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 78618, - "real_time": 8.9181147769063300e+03, - "cpu_time": 1.5989921557403712e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1482247376448576e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 78618, - "real_time": 8.9296928252413218e+03, - "cpu_time": 1.5984793266173159e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1467359740589137e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9241712423441222e+03, - "cpu_time": 1.5979819501895161e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1474585808525342e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time_median", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9181147769063318e+03, - "cpu_time": 1.5984793266173157e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1482247376448576e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3754524877483362e+01, - "cpu_time": 3.9953317665923961e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3279206832785188e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.7823708175076464e-03, - "cpu_time": 2.5002358544278687e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7717445801511876e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 72520, - "real_time": 9.6506697487261299e+03, - "cpu_time": 1.6734596856039519e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1221325082337752e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 72520, - "real_time": 9.6559649508630937e+03, - "cpu_time": 1.6758456549916613e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1209687591263890e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 72520, - "real_time": 9.6988680919900762e+03, - "cpu_time": 1.6989920173744860e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1115866104946464e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 72520, - "real_time": 9.6531406106188624e+03, - "cpu_time": 1.6752738430777477e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1215893175192261e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 72520, - "real_time": 9.6487985973182604e+03, - "cpu_time": 1.6740592939878607e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1225440445706999e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6614883999032863e+03, - "cpu_time": 1.6795260990071420e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1197642479889473e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time_median", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6531406106188624e+03, - "cpu_time": 1.6752738430777477e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1215893175192261e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1068399076592591e+01, - "cpu_time": 1.0922873422559432e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6095391983364237e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1806577004018853e-03, - "cpu_time": 6.5035449160430027e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1745527610957508e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 68801, - "real_time": 1.0171003078527227e+04, - "cpu_time": 1.7330009156843873e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0271347559095478e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 68801, - "real_time": 1.0172770313411116e+04, - "cpu_time": 1.7368668885626765e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0264351536573094e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 68801, - "real_time": 1.0170226349932278e+04, - "cpu_time": 1.7342328890567758e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0274423194398957e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 68801, - "real_time": 1.0175800550583621e+04, - "cpu_time": 1.7385793200679538e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0252361272598630e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 68801, - "real_time": 1.0173228463795833e+04, - "cpu_time": 1.7320046292931245e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0262538235297841e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0172605751250016e+04, - "cpu_time": 1.7349369285329834e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0265004359592801e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time_median", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0172770313411116e+04, - "cpu_time": 1.7342328890567758e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0264351536573094e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1709275030557089e+00, - "cpu_time": 2.7310235250557287e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5922381484686513e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1340918503491045e-04, - "cpu_time": 1.5741341832898846e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1339220708221834e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 61998, - "real_time": 1.1282195635630136e+04, - "cpu_time": 1.8745637294751603e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2609980047934687e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 61998, - "real_time": 1.1280371014615093e+04, - "cpu_time": 1.8733915110165141e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2621724847403216e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 61998, - "real_time": 1.1278370628988603e+04, - "cpu_time": 1.8719960724539993e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2634605383017313e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 61998, - "real_time": 1.1285610225489299e+04, - "cpu_time": 1.8749955385658210e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2588011071814489e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 61998, - "real_time": 1.1286838053634850e+04, - "cpu_time": 1.8769390351301980e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2580114652764249e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1282677111671597e+04, - "cpu_time": 1.8743771773283388e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2606887200586796e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time_median", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1282195635630136e+04, - "cpu_time": 1.8745637294751599e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2609980047934687e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5359684123912061e+00, - "cpu_time": 1.8453648839572672e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2754651480521515e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1339799742503935e-04, - "cpu_time": 9.8452163538801491e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1339522127781861e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 61973, - "real_time": 1.1289896959867405e+04, - "cpu_time": 1.9014967760154068e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4512089931591742e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 61973, - "real_time": 1.1304008709715865e+04, - "cpu_time": 1.9238504816614106e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4493973262704451e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 61973, - "real_time": 1.1300877171571032e+04, - "cpu_time": 1.9185631694447868e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4497989626164851e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 61973, - "real_time": 1.1304104154766417e+04, - "cpu_time": 1.9236313620447942e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4493850884319415e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 61973, - "real_time": 1.1295308169207492e+04, - "cpu_time": 1.9160806932051179e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4505137668279786e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1298839033025642e+04, - "cpu_time": 1.9167244964743033e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4500608274612050e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time_median", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1300877171571032e+04, - "cpu_time": 1.9185631694447868e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4497989626164851e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.1446876357963767e+00, - "cpu_time": 9.1400646634875983e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8880745432583231e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.4383354058199472e-04, - "cpu_time": 4.7685855115329216e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4398232087056095e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 60843, - "real_time": 1.1508933404448473e+04, - "cpu_time": 1.9998803066909571e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8471795646444874e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 60843, - "real_time": 1.1505664958557136e+04, - "cpu_time": 2.0043709531088109e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8479883707746396e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 60843, - "real_time": 1.1519615624062999e+04, - "cpu_time": 2.0221486876058203e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8445393552500014e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 60843, - "real_time": 1.1514726975193775e+04, - "cpu_time": 2.0129563893956012e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8457470221041489e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 60843, - "real_time": 1.1510779878535859e+04, - "cpu_time": 2.0031563417319830e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8467228411779866e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1511944168159647e+04, - "cpu_time": 2.0085025357066344e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8464354307902527e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time_median", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1510779878535857e+04, - "cpu_time": 2.0043709531088105e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8467228411779866e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3954608761588752e+00, - "cpu_time": 9.0284117140508172e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3338826315984477e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6868372512454760e-04, - "cpu_time": 4.4950959999034441e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6861510265424266e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 54901, - "real_time": 1.2759609653284186e+04, - "cpu_time": 2.3437281506711955e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1362072806930847e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 54901, - "real_time": 1.2752233471726131e+04, - "cpu_time": 2.3455536729749485e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1391781796737375e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 54901, - "real_time": 1.2761757529082293e+04, - "cpu_time": 2.3443068596199817e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1353428280276012e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 54901, - "real_time": 1.2753227187896900e+04, - "cpu_time": 2.3456732573176356e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1387777410720892e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 54901, - "real_time": 1.2752728836735010e+04, - "cpu_time": 2.3451943716871883e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1389785542384911e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2755911335744906e+04, - "cpu_time": 2.3448912624541903e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1376969167410002e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time_median", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2753227187896900e+04, - "cpu_time": 2.3451943716871883e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1387777410720892e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4360782934329608e+00, - "cpu_time": 8.4210073033957329e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7864535422338864e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.4776647286674696e-04, - "cpu_time": 3.5912144150267367e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4771485573872445e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 45241, - "real_time": 1.5476406945272227e+04, - "cpu_time": 2.9138227824318459e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4691492323442822e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 45241, - "real_time": 1.5474543299298874e+04, - "cpu_time": 2.9156617095113321e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4701691975580740e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 45241, - "real_time": 1.5476827885679177e+04, - "cpu_time": 2.9137750801264181e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4689188875248709e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 45241, - "real_time": 1.5475031397127512e+04, - "cpu_time": 2.9143987820781917e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4699020400262127e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 45241, - "real_time": 1.5478892873065035e+04, - "cpu_time": 2.9139396189297207e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4677890773492985e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5476340480088566e+04, - "cpu_time": 2.9143195946155018e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4691856869605474e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time_median", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5476406945272227e+04, - "cpu_time": 2.9139396189297211e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4691492323442822e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7102813025203480e+00, - "cpu_time": 7.8981689925381406e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3587981450611493e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1050941304378443e-04, - "cpu_time": 2.7101245200186009e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1050410855284801e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 30081, - "real_time": 2.3274300452187825e+04, - "cpu_time": 4.4335092583357800e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1263238632607666e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 30081, - "real_time": 2.3269763166495082e+04, - "cpu_time": 4.4317280143612865e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1265434810159454e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 30081, - "real_time": 2.3274316409540097e+04, - "cpu_time": 4.4317963598283568e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1263230910298515e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 30081, - "real_time": 2.3269740992675015e+04, - "cpu_time": 4.4337733419767705e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1265445545032890e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 30081, - "real_time": 2.3273507487397983e+04, - "cpu_time": 4.4322753997540807e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1263622388758736e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3272325701659203e+04, - "cpu_time": 4.4326164748512543e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1264194457371452e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time_median", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3273507487397983e+04, - "cpu_time": 4.4322753997540800e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1263622388758736e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3720498542241866e+00, - "cpu_time": 9.6354641753410117e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1481487178932875e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0192577590365502e-04, - "cpu_time": 2.1737644639477518e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0192905691022782e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 18929, - "real_time": 3.6981028695621171e+04, - "cpu_time": 7.1140195044640423e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4177215142262377e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 18929, - "real_time": 3.6978307260303998e+04, - "cpu_time": 7.1139334460353755e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4178258520849606e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 18929, - "real_time": 3.6980056665507065e+04, - "cpu_time": 7.1133680648737922e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4177587793937229e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 18929, - "real_time": 3.6976818635853939e+04, - "cpu_time": 7.1178151513551100e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4178829313661751e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 18929, - "real_time": 3.6982346897033065e+04, - "cpu_time": 7.1236487453115129e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4176709808594147e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6979711630863851e+04, - "cpu_time": 7.1165569824079663e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4177720115861023e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time_median", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6980056665507058e+04, - "cpu_time": 7.1140195044640423e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4177587793937229e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1874649786467075e+00, - "cpu_time": 4.3407091180081792e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.3866382413932704e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.9153110778208852e-05, - "cpu_time": 6.0994510811033381e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9153645105540609e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10894, - "real_time": 6.4247751014648842e+04, - "cpu_time": 1.2555978612080037e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6320820315732435e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10894, - "real_time": 6.4253140765407108e+04, - "cpu_time": 1.2548435735267428e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6319451275205790e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10894, - "real_time": 6.4236030084096295e+04, - "cpu_time": 1.2551082797870271e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6323798320463282e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10894, - "real_time": 6.4245549445055054e+04, - "cpu_time": 1.2549159693409030e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6321379598391905e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10894, - "real_time": 6.4246091122534017e+04, - "cpu_time": 1.2553677528915314e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6321241988093761e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4245712486348275e+04, - "cpu_time": 1.2551666873508417e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6321338299577436e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time_median", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4246091122534024e+04, - "cpu_time": 1.2551082797870270e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6321241988093761e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.1897856023771869e+00, - "cpu_time": 3.1504434352338070e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5725657477638256e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.6345504825593925e-05, - "cpu_time": 2.5099801221486697e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6350294252802772e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6546, - "real_time": 1.0689663948368719e+05, - "cpu_time": 2.1925106034219681e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9618502603349220e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6546, - "real_time": 1.0715120637713716e+05, - "cpu_time": 2.1947155163458386e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9571893503641125e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6546, - "real_time": 1.0692132338219209e+05, - "cpu_time": 2.1915087549648763e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9613973468170559e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6546, - "real_time": 1.0694065852929560e+05, - "cpu_time": 2.1922696532232899e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9610427211138786e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6546, - "real_time": 1.0716433267373120e+05, - "cpu_time": 2.1935153437213899e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9569496190350163e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0701483208920865e+05, - "cpu_time": 2.1929039743354730e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9596858595329967e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time_median", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0694065852929562e+05, - "cpu_time": 2.1925106034219678e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9610427211138786e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3149473226223921e+02, - "cpu_time": 1.2408865805341532e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4069930933797047e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2287524046444690e-03, - "cpu_time": 5.6586453171538701e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2282545601228676e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3431, - "real_time": 2.0403573874050155e+05, - "cpu_time": 4.1740139376274816e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0556712397010189e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3431, - "real_time": 2.0416741239648563e+05, - "cpu_time": 4.1746858758380730e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0543454759836086e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3431, - "real_time": 2.0411382080581694e+05, - "cpu_time": 4.1740530661614961e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0548848595560013e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3431, - "real_time": 2.0403365879212390e+05, - "cpu_time": 4.1730719790148246e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0556921955084347e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3431, - "real_time": 2.0409777948446356e+05, - "cpu_time": 4.1753563858933031e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0550463658127556e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0408968204387830e+05, - "cpu_time": 4.1742362489070359e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0551280273123638e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time_median", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0409777948446354e+05, - "cpu_time": 4.1740530661614961e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0550463658127556e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.6433015089434150e+01, - "cpu_time": 8.5078990560854535e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6823216906894669e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7651086779243117e-04, - "cpu_time": 2.0381929887924112e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7649477867909967e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1751, - "real_time": 3.9971269089260540e+05, - "cpu_time": 7.8951837178757635e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0986594099044624e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1751, - "real_time": 3.9979967271785717e+05, - "cpu_time": 7.8957203026841232e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0982028181698708e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1751, - "real_time": 3.9973333706017659e+05, - "cpu_time": 7.8943416504855407e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0985510144572113e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1751, - "real_time": 3.9971423956210795e+05, - "cpu_time": 7.8959001941749558e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0986512787710110e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1751, - "real_time": 3.9973726863696269e+05, - "cpu_time": 7.8956867732724454e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0985303743640800e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9973944177394197e+05, - "cpu_time": 7.8953665276985662e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0985189791333271e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time_median", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9973333706017659e+05, - "cpu_time": 7.8956867732724454e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0985510144572113e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5427806060258519e+01, - "cpu_time": 6.3172513200629204e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8596899264985011e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.8627246545997380e-05, - "cpu_time": 8.0012134938899998e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8619161655928376e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 885, - "real_time": 7.9061869942283223e+05, - "cpu_time": 1.6416652372881004e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1220363257595234e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 885, - "real_time": 7.9065828253962309e+05, - "cpu_time": 1.6419627333333290e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1219300892050323e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 885, - "real_time": 7.9070367754337064e+05, - "cpu_time": 1.6418550508474433e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1218082673050121e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 885, - "real_time": 7.9086530581379763e+05, - "cpu_time": 1.6420794158192247e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1213746356892345e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 885, - "real_time": 7.9061616814595321e+05, - "cpu_time": 1.6418119412429214e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1220431197788013e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9069242669311538e+05, - "cpu_time": 1.6418748757062037e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1218384875475208e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time_median", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9065828253962309e+05, - "cpu_time": 1.6418550508474433e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1219300892050323e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0299353355018795e+02, - "cpu_time": 1.5641104098090767e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7634986122377552e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3025739222131434e-04, - "cpu_time": 9.5263678916843194e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3024076188908624e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 74, - "real_time": 9.3526977013695892e+06, - "cpu_time": 1.8102958851351239e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5876741739537206e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 74, - "real_time": 9.3274740628092680e+06, - "cpu_time": 1.8077036054053623e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5973760713834682e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 74, - "real_time": 9.3412902583745681e+06, - "cpu_time": 1.8085674121622145e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5920553876289291e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 74, - "real_time": 9.3299410733822230e+06, - "cpu_time": 1.8077241283783771e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5964248580013905e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 74, - "real_time": 9.3733573684821259e+06, - "cpu_time": 1.8129512040540911e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5797666386674466e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3449520928835552e+06, - "cpu_time": 1.8094484470270343e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5906594259269915e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time_median", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3412902583745699e+06, - "cpu_time": 1.8085674121622153e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5920553876289291e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8782141826391362e+04, - "cpu_time": 2.2238158453729236e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2087929966451386e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0098703171196023e-03, - "cpu_time": 1.2290020470197450e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0076515596530193e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 38, - "real_time": 1.8299787452346399e+07, - "cpu_time": 3.5437828473682858e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6671936313334227e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 38, - "real_time": 1.8269395749819905e+07, - "cpu_time": 3.5415403815788619e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6732941208885651e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 38, - "real_time": 1.8316469449353844e+07, - "cpu_time": 3.5464891368422367e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6638536801843882e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 38, - "real_time": 1.8258507118413322e+07, - "cpu_time": 3.5411903263158262e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6754847241767163e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 38, - "real_time": 1.8281281925737858e+07, - "cpu_time": 3.5422041184210986e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6709058080614548e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8285088339134265e+07, - "cpu_time": 3.5430413621052623e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6701463929289093e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time_median", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8281281925737858e+07, - "cpu_time": 3.5422041184210986e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6709058080614548e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3281674367520322e+04, - "cpu_time": 2.1689400661976448e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6717159023211161e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2732601525195927e-03, - "cpu_time": 6.1216899395971733e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2728963376833909e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19, - "real_time": 3.6181032265487470e+07, - "cpu_time": 6.9239815578947335e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7096157736778622e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19, - "real_time": 3.6201057269384988e+07, - "cpu_time": 6.9250991789473176e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7075637598437524e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19, - "real_time": 3.6112442612648010e+07, - "cpu_time": 6.9190219052631482e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7166615794909320e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19, - "real_time": 3.6145503975843132e+07, - "cpu_time": 6.9222580157893270e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7132620446985826e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19, - "real_time": 3.6162665603976503e+07, - "cpu_time": 6.9254336736841992e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7114998509745150e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6160540345468022e+07, - "cpu_time": 6.9231588663157448e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7117206017371287e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time_median", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6162665603976496e+07, - "cpu_time": 6.9239815578947335e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7114998509745150e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3932067965033784e+04, - "cpu_time": 2.6240408455068489e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4838080509235868e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.3837281304029159e-04, - "cpu_time": 3.7902363591192135e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3859652294225047e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 7.1464590728282928e+07, - "cpu_time": 1.3447244660000023e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7562022431587729e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 7.1534256637096405e+07, - "cpu_time": 1.3460246890000463e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7525441462516589e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 7.1393281221389771e+07, - "cpu_time": 1.3442137650000066e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7599540377978234e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 7.1437073498964310e+07, - "cpu_time": 1.3448762660000283e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7576491148379946e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 7.1296973526477814e+07, - "cpu_time": 1.3436028550000289e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7650329701626139e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1425235122442260e+07, - "cpu_time": 1.3446884082000226e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7582765024417725e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time_median", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1437073498964310e+07, - "cpu_time": 1.3447244660000023e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7576491148379946e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8100497034425600e+04, - "cpu_time": 8.9804635322234841e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6373498685693322e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2334645714976984e-03, - "cpu_time": 6.6784717392221610e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2339033239189348e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4046575725078583e+08, - "cpu_time": 2.5566771159999460e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.8220768001234446e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4037536084651947e+08, - "cpu_time": 2.5562989539999992e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.8245380725111165e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4046006500720978e+08, - "cpu_time": 2.5554949820000276e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.8222316924916883e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4070118069648743e+08, - "cpu_time": 2.5598838459999341e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.8156816406402969e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4054018855094910e+08, - "cpu_time": 2.5566251120000061e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.8200525951718912e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4050851047039032e+08, - "cpu_time": 2.5569960019999829e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.8209161601876879e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time_median", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4046575725078583e+08, - "cpu_time": 2.5566251120000061e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.8220768001234446e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2250402018009359e+05, - "cpu_time": 1.6820989559679112e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3294856433989923e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7186192330968547e-04, - "cpu_time": 6.5784184044567881e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7138411412707997e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8219200670719147e+08, - "cpu_time": 4.4832862500001627e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8050043887817764e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8125417232513428e+08, - "cpu_time": 4.4789055699999380e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8176920723463526e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8237935900688171e+08, - "cpu_time": 4.4877186600001550e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8024798546760368e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8024043142795563e+08, - "cpu_time": 4.4696101200000268e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8315021802128439e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8129057586193085e+08, - "cpu_time": 4.4793459050001162e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8171980014255342e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8147130906581879e+08, - "cpu_time": 4.4797733010000801e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8147752994885087e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time_median", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8129057586193085e+08, - "cpu_time": 4.4793459050001162e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.8171980014255342e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5715115357234213e+05, - "cpu_time": 6.7025258818194945e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1627706636877282e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0452523080137712e-03, - "cpu_time": 1.4961752373324785e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0480711769409704e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 96202, - "real_time": 7.2664447630337399e+03, - "cpu_time": 1.4373250878360090e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5230433636864252e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 96202, - "real_time": 7.2654833886892329e+03, - "cpu_time": 1.4435524583688983e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5235095354912780e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 96202, - "real_time": 7.2608465320837122e+03, - "cpu_time": 1.4356411218061749e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5257596875075847e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 96202, - "real_time": 7.2623431099879590e+03, - "cpu_time": 1.4459369753227400e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5250331211688571e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 96202, - "real_time": 7.2692022134514818e+03, - "cpu_time": 1.4384846915864460e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5217069560436524e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2648640014492266e+03, - "cpu_time": 1.4401880669840535e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5238105327795595e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time_median", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2654833886892347e+03, - "cpu_time": 1.4384846915864462e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5235095354912780e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3240594513686950e+00, - "cpu_time": 4.3629670029436930e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6123049804550006e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5755288064657472e-04, - "cpu_time": 3.0294425450145060e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5754587695815319e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 94471, - "real_time": 7.4064800751733565e+03, - "cpu_time": 1.4521985170052581e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9128654205961138e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 94471, - "real_time": 7.4215074114785921e+03, - "cpu_time": 1.4607158927077888e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.8988680009684712e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 94471, - "real_time": 7.4168397348885401e+03, - "cpu_time": 1.4538853203628289e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9032096998344302e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 94471, - "real_time": 7.4139133770268318e+03, - "cpu_time": 1.4588496099332509e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9059344770133406e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 94471, - "real_time": 7.4069081445264437e+03, - "cpu_time": 1.4523027130018960e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9124659035816148e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4131297486187523e+03, - "cpu_time": 1.4555904106022044e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9066687003987953e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time_median", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4139133770268327e+03, - "cpu_time": 1.4538853203628289e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9059344770133406e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4708929252362521e+00, - "cpu_time": 3.9406274088685727e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0282996441782816e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7289621855626343e-04, - "cpu_time": 2.7072364452018216e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7282305054391910e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 92380, - "real_time": 7.6059781134890673e+03, - "cpu_time": 1.4669208032041302e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3463094223002750e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 92380, - "real_time": 7.5750815511779520e+03, - "cpu_time": 1.4741868348127591e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3518006282595921e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 92380, - "real_time": 7.6035603673996739e+03, - "cpu_time": 1.4673846189651169e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3467375157438195e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 92380, - "real_time": 7.5774925691872531e+03, - "cpu_time": 1.4716679075557504e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3513705102977517e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 92380, - "real_time": 7.6016205798805686e+03, - "cpu_time": 1.4673634823554430e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3470811772824475e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5927466362269042e+03, - "cpu_time": 1.4695047293786400e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3486598507767773e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time_median", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6016205798805695e+03, - "cpu_time": 1.4673846189651169e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3470811772824475e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5128594113004940e+01, - "cpu_time": 3.2541486052255834e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6890636956011289e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9925061164062304e-03, - "cpu_time": 2.2144526248660361e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9938783630671065e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 89028, - "real_time": 7.8676131316642268e+03, - "cpu_time": 1.4978823111830128e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6030766456443560e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 89028, - "real_time": 7.8621279535948834e+03, - "cpu_time": 1.5034252482364820e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6048927365314266e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 89028, - "real_time": 7.8841600722453222e+03, - "cpu_time": 1.5139948533045606e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5976134188467234e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 89028, - "real_time": 7.8992004409977508e+03, - "cpu_time": 1.5245964292132494e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5926674671662295e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 89028, - "real_time": 7.8753104734372091e+03, - "cpu_time": 1.5046714415689152e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6005323941293997e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8776824143878785e+03, - "cpu_time": 1.5089140567012440e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5997565324636269e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time_median", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8753104734372073e+03, - "cpu_time": 1.5046714415689150e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6005323941293997e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4611154381570291e+01, - "cpu_time": 1.0506872898595900e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8180257328079932e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8547529099274594e-03, - "cpu_time": 6.9632016826497081e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8532603621317766e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 81105, - "real_time": 8.6338346017745935e+03, - "cpu_time": 1.5834523124345493e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7441260910396767e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 81105, - "real_time": 8.6318693508656488e+03, - "cpu_time": 1.5886256174095231e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7452062044813406e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 81105, - "real_time": 8.6353042296769454e+03, - "cpu_time": 1.5830950804512622e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7433186961998159e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 81105, - "real_time": 8.6274368194665221e+03, - "cpu_time": 1.5880012785894267e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7476441563246083e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 81105, - "real_time": 8.6382240711759569e+03, - "cpu_time": 1.5831656519327717e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7417153876194763e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6333338145919333e+03, - "cpu_time": 1.5852679881635067e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7444021071329844e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time_median", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6338346017745916e+03, - "cpu_time": 1.5834523124345495e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7441260910396767e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0301097504032413e+00, - "cpu_time": 2.7920679886204898e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2150553798945976e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6680805317542677e-04, - "cpu_time": 1.7612593009305832e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6687766548378487e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 65648, - "real_time": 1.0667344964694181e+04, - "cpu_time": 1.8102275210210897e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6795116564741695e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 65648, - "real_time": 1.0663728114279704e+04, - "cpu_time": 1.8130067877163485e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6821163407478154e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 65648, - "real_time": 1.0668741626170931e+04, - "cpu_time": 1.8102591579332820e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6785063197187507e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 65648, - "real_time": 1.0660874456546591e+04, - "cpu_time": 1.8125253671094786e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6841726571214676e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 65648, - "real_time": 1.0667123390765371e+04, - "cpu_time": 1.8106359310260570e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6796711727286208e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0665562510491356e+04, - "cpu_time": 1.8113309529612514e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6807956293581653e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time_median", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0667123390765370e+04, - "cpu_time": 1.8106359310260570e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6796711727286208e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2040258271036870e+00, - "cpu_time": 1.3308276933298178e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3077328060241291e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0040851797099254e-04, - "cpu_time": 7.3472365232544405e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0045491605105648e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 65143, - "real_time": 1.0746032068928584e+04, - "cpu_time": 1.8378897272155737e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5246557887513864e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 65143, - "real_time": 1.0743590658756824e+04, - "cpu_time": 1.8428176089526572e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5250022567311633e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 65143, - "real_time": 1.0744440248496807e+04, - "cpu_time": 1.8378791627650884e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5248816709918592e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 65143, - "real_time": 1.0742134166523789e+04, - "cpu_time": 1.8422394716239509e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5252090269974675e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 65143, - "real_time": 1.0746014628181296e+04, - "cpu_time": 1.8376108008536103e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5246582632628429e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0744442354177461e+04, - "cpu_time": 1.8396873542821762e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5248814013469439e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time_median", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0744440248496809e+04, - "cpu_time": 1.8378897272155737e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5248816709918592e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6622543707020045e+00, - "cpu_time": 2.6040780999708119e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3592176194662502e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5470829624356607e-04, - "cpu_time": 1.4155003533124198e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5471482683061965e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 64449, - "real_time": 1.0869701593967320e+04, - "cpu_time": 1.9511934351192049e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0146181766559467e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 64449, - "real_time": 1.0864411030406493e+04, - "cpu_time": 1.9533302316561821e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0160861834379606e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 64449, - "real_time": 1.0870163302242852e+04, - "cpu_time": 1.9507452652485652e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0144901312787952e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 64449, - "real_time": 1.0863072844010307e+04, - "cpu_time": 1.9534962078543129e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0164577252252946e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 64449, - "real_time": 1.0871230880597790e+04, - "cpu_time": 1.9513298608201505e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0141941018364377e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0867715930244955e+04, - "cpu_time": 1.9520190001396830e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0151692636868873e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time_median", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0869701593967320e+04, - "cpu_time": 1.9513298608201505e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0146181766559467e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7002695412805728e+00, - "cpu_time": 1.2923178689407024e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0267343050273523e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.4048272562799408e-04, - "cpu_time": 6.6204164449640420e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4052294091505914e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 60185, - "real_time": 1.1642063071351055e+04, - "cpu_time": 2.1606578798704017e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.6292428239176846e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 60185, - "real_time": 1.1631883965167330e+04, - "cpu_time": 2.1622182553791979e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.6341689958611298e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 60185, - "real_time": 1.1636174678325528e+04, - "cpu_time": 2.1596509080337048e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.6320914571755791e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 60185, - "real_time": 1.1632397094612916e+04, - "cpu_time": 2.1616471745451407e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.6339204608438282e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 60185, - "real_time": 1.1640040073558923e+04, - "cpu_time": 2.1609633297333738e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.6302211664089642e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1636511776603151e+04, - "cpu_time": 2.1610275095123638e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.6319289808414373e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time_median", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1636174678325528e+04, - "cpu_time": 2.1609633297333734e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.6320914571755791e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5201392260400048e+00, - "cpu_time": 9.7949441184136941e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1875858597458522e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8844451952761157e-04, - "cpu_time": 4.5325402269515413e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8842568277894305e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 44362, - "real_time": 1.5785923949672193e+04, - "cpu_time": 2.8984440579774848e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.3030933392227459e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 44362, - "real_time": 1.5778865967259339e+04, - "cpu_time": 2.9007498106488514e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.3068073632142115e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 44362, - "real_time": 1.5786922935847993e+04, - "cpu_time": 2.8992191244760212e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.3025679248974857e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 44362, - "real_time": 1.5778584441664143e+04, - "cpu_time": 2.9011012645958523e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.3069555754252462e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 44362, - "real_time": 1.5787871451382356e+04, - "cpu_time": 2.8986749808395522e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.3020691170197983e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5783633749165205e+04, - "cpu_time": 2.8996378477075523e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.3042986639558983e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time_median", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5785923949672191e+04, - "cpu_time": 2.8992191244760208e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.3030933392227459e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5345655198741976e+00, - "cpu_time": 1.2150747143768632e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3859953571790536e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8729540940558319e-04, - "cpu_time": 4.1904361102801125e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8732051359559881e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 30923, - "real_time": 2.2644833975138725e+04, - "cpu_time": 4.2603064450411257e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1576326869422060e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 30923, - "real_time": 2.2637062632822155e+04, - "cpu_time": 4.2641071888239327e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1580301042234587e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 30923, - "real_time": 2.2646143323922930e+04, - "cpu_time": 4.2613350483457274e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1575657552386694e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 30923, - "real_time": 2.2632685435027237e+04, - "cpu_time": 4.2659576981534192e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1582540691096939e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 30923, - "real_time": 2.2644922226212861e+04, - "cpu_time": 4.2593070594699937e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1576281754527403e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2641129518624781e+04, - "cpu_time": 4.2622026879668396e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1578221581933538e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time_median", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2644833975138728e+04, - "cpu_time": 4.2613350483457267e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1576326869422060e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9390230780575681e+00, - "cpu_time": 2.7595482032442931e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0375142915482717e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6231125409057344e-04, - "cpu_time": 6.4744649780150529e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6234722405796393e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19306, - "real_time": 3.6270016264082005e+04, - "cpu_time": 6.9178648554852480e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4455135508698391e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19306, - "real_time": 3.6263593349748327e+04, - "cpu_time": 6.9244960116024842e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4457695765100969e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19306, - "real_time": 3.6269030237846062e+04, - "cpu_time": 6.9223650056978513e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4455528492540592e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19306, - "real_time": 3.6258413668410503e+04, - "cpu_time": 6.9237338340410148e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4459761113508852e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19306, - "real_time": 3.6268117870411101e+04, - "cpu_time": 6.9255157930175177e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4455892138470575e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6265834278099603e+04, - "cpu_time": 6.9227950999688241e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4456802603663877e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time_median", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6268117870411101e+04, - "cpu_time": 6.9237338340410133e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4455892138470575e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8219593504577505e+00, - "cpu_time": 2.9861674604806666e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9223702383047862e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3296148968975079e-04, - "cpu_time": 4.3135285926548860e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3297340297207819e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10978, - "real_time": 6.3790706671090782e+04, - "cpu_time": 1.2231988467845753e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6437754881859657e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10978, - "real_time": 6.3778274123413365e+04, - "cpu_time": 1.2227199927127409e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6440959157517588e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10978, - "real_time": 6.3791916091926571e+04, - "cpu_time": 1.2229677883038373e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6437443241067760e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10978, - "real_time": 6.3796056314618560e+04, - "cpu_time": 1.2228409327746443e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6436376487424408e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10978, - "real_time": 6.3794379386663633e+04, - "cpu_time": 1.2226748260156497e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6436808541462311e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3790266517542594e+04, - "cpu_time": 1.2228804773182896e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6437868461866346e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time_median", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3791916091926571e+04, - "cpu_time": 1.2228409327746443e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6437443241067760e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0208579696398186e+00, - "cpu_time": 2.1130183560537475e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8093874520621612e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1006158702455104e-04, - "cpu_time": 1.7279025998415492e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1007433574856119e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6833, - "real_time": 1.0241791065166752e+05, - "cpu_time": 2.1303915249523858e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0476418496102711e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6833, - "real_time": 1.0244420847866956e+05, - "cpu_time": 2.1311812103030505e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0471162119785995e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6833, - "real_time": 1.0239216187781883e+05, - "cpu_time": 2.1301388628712634e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0481567744437916e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6833, - "real_time": 1.0240240022459165e+05, - "cpu_time": 2.1313303717253910e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0479519966333511e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6833, - "real_time": 1.0244914368415826e+05, - "cpu_time": 2.1280671022976434e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0470175977901150e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0242116498338120e+05, - "cpu_time": 2.1302218144299471e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0475768860912258e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time_median", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0241791065166754e+05, - "cpu_time": 2.1303915249523861e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0476418496102711e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5088330639421443e+01, - "cpu_time": 1.3065036084359431e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0155326679905094e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4495259982145552e-04, - "cpu_time": 6.1331810592953073e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4494966230865394e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3580, - "real_time": 1.9529698906478073e+05, - "cpu_time": 4.0728102039107226e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1476542060813515e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3580, - "real_time": 1.9540818919155840e+05, - "cpu_time": 4.0726535977652459e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1464320494205742e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3580, - "real_time": 1.9536171276034534e+05, - "cpu_time": 4.0719118435752578e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1469426842839203e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3580, - "real_time": 1.9538973301779816e+05, - "cpu_time": 4.0723449469274707e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1466347976523098e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3580, - "real_time": 1.9534432617674308e+05, - "cpu_time": 4.0714731452513975e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1471337724982552e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9536019004224514e+05, - "cpu_time": 4.0722387474860199e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1469595019872822e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time_median", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9536171276034534e+05, - "cpu_time": 4.0723449469274713e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1469426842839203e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3084365458444253e+01, - "cpu_time": 5.4839640176286522e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7352559069515979e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2053810169373600e-04, - "cpu_time": 1.3466705558494470e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2055636832313421e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1819, - "real_time": 3.8495958458446374e+05, - "cpu_time": 7.7346767564598692e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1790879707683861e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1819, - "real_time": 3.8499001426319679e+05, - "cpu_time": 7.7382375810882950e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1789157352702564e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1819, - "real_time": 3.8502598534964857e+05, - "cpu_time": 7.7394118086866266e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1787121698765770e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1819, - "real_time": 3.8486854849079112e+05, - "cpu_time": 7.7340418691590056e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1796034082012596e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1819, - "real_time": 3.8493846753948031e+05, - "cpu_time": 7.7359052281472040e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1792075116887718e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8495652004551614e+05, - "cpu_time": 7.7364546487082005e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1791053591610504e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time_median", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8495958458446374e+05, - "cpu_time": 7.7359052281472040e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1790879707683861e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9206355008635320e+01, - "cpu_time": 2.3026024342983163e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3516614122073846e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5380010968936162e-04, - "cpu_time": 2.9763018577027330e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5380905737838051e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 919, - "real_time": 7.6215042940658133e+05, - "cpu_time": 1.6119425233949912e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.2012998159776573e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 919, - "real_time": 7.6240522790015128e+05, - "cpu_time": 1.6120480097932799e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.2005641338804192e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 919, - "real_time": 7.6238350789199478e+05, - "cpu_time": 1.6122442002176777e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.2006268270924862e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 919, - "real_time": 7.6211940675013186e+05, - "cpu_time": 1.6119464374319138e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.2013894215792580e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 919, - "real_time": 7.6223639692803100e+05, - "cpu_time": 1.6120471164309755e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.2010515461627941e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6225899377537821e+05, - "cpu_time": 1.6120456574537675e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.2009863489385235e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time_median", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6223639692803111e+05, - "cpu_time": 1.6120471164309757e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.2010515461627941e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3102438820947913e+02, - "cpu_time": 1.2238069677936983e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7831908317080704e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7188959301159688e-04, - "cpu_time": 7.5916396172469840e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7188615611053661e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 74, - "real_time": 9.3612740244212989e+06, - "cpu_time": 1.8077906013514634e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5843873293810868e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 74, - "real_time": 9.3748179088170473e+06, - "cpu_time": 1.8123592824324347e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5792089325214467e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 74, - "real_time": 9.3550623545574173e+06, - "cpu_time": 1.8091651689188268e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5867673274944663e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 74, - "real_time": 9.3599856403228398e+06, - "cpu_time": 1.8095470540540215e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5848807134326606e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 74, - "real_time": 9.3643639010150693e+06, - "cpu_time": 1.8093864486486934e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5832046206964254e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3631007658267356e+06, - "cpu_time": 1.8096497110810880e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5836897847052174e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time_median", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3612740244213007e+06, - "cpu_time": 1.8093864486486934e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5843873293810868e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3577169878505474e+03, - "cpu_time": 1.6667852721352610e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8146744857620746e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.8582054939583699e-04, - "cpu_time": 9.2105409236327863e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8541242542108051e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 38, - "real_time": 1.8419302068650723e+07, - "cpu_time": 3.5537425105264664e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6433988513722200e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 38, - "real_time": 1.8458653584514793e+07, - "cpu_time": 3.5570271421052344e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6356315856265111e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 38, - "real_time": 1.8418413586914539e+07, - "cpu_time": 3.5537764947369061e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6435746044750485e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 38, - "real_time": 1.8412981917591471e+07, - "cpu_time": 3.5534613605265304e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6446494272546511e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 38, - "real_time": 1.8424847065226030e+07, - "cpu_time": 3.5521832026317589e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6423023628053513e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8426839644579507e+07, - "cpu_time": 3.5540381421053790e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6419113663067570e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time_median", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8419302068650723e+07, - "cpu_time": 3.5537425105264656e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6433988513722200e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8275306036510199e+04, - "cpu_time": 1.7932830099102568e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6077858313375534e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.9177647328613466e-04, - "cpu_time": 5.0457618579409307e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9062977334239471e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19, - "real_time": 3.6598808083095051e+07, - "cpu_time": 6.9663168526319981e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6672704667121396e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19, - "real_time": 3.6457208230307229e+07, - "cpu_time": 6.9578491789475024e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6815141508400941e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19, - "real_time": 3.6526706461843692e+07, - "cpu_time": 6.9617895789472058e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6745094480446987e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19, - "real_time": 3.6565132243068598e+07, - "cpu_time": 6.9618660421054438e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6706479579447646e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19, - "real_time": 3.6565789070568584e+07, - "cpu_time": 6.9625199210523337e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6705820224738545e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6542728817776628e+07, - "cpu_time": 6.9620683147368982e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6729048092031107e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time_median", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6565132243068591e+07, - "cpu_time": 6.9618660421054453e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6706479579447646e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4196539310825450e+04, - "cpu_time": 3.0072303343736323e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4527552742297174e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4831004980794134e-03, - "cpu_time": 4.3194496210387695e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4845893257475330e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.2198604544003800e+07, - "cpu_time": 1.3463926144445142e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7180144643431883e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.2325127820173904e+07, - "cpu_time": 1.3488845300000522e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7115102882006159e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.2395864460203379e+07, - "cpu_time": 1.3493584122222221e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7078838411766081e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.2128612962034017e+07, - "cpu_time": 1.3469525688889110e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7216223212457318e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.2319990230931178e+07, - "cpu_time": 1.3481021288888919e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7117739527181306e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2273640003469259e+07, - "cpu_time": 1.3479380508889183e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7141609735368557e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time_median", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2319990230931178e+07, - "cpu_time": 1.3481021288888922e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7117739527181306e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0770482765103337e+05, - "cpu_time": 1.2549620703551706e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5373164261400122e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4902366567653620e-03, - "cpu_time": 9.3102355076894413e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4908660301998257e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4213614761829376e+08, - "cpu_time": 2.5752856340000111e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7771595825276294e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4226868748664856e+08, - "cpu_time": 2.5751518540000686e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7736407180278764e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4186769723892212e+08, - "cpu_time": 2.5715299140001661e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7843069454764276e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4195057749748230e+08, - "cpu_time": 2.5718503260000032e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7820974135136728e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4215550720691681e+08, - "cpu_time": 2.5746969940000781e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7766451863067718e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4207572340965271e+08, - "cpu_time": 2.5737029444000655e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7787699691704750e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time_median", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4213614761829376e+08, - "cpu_time": 2.5746969940000781e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7771595825276294e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6293254842418112e+05, - "cpu_time": 1.8538228108514953e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3343758818081291e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1468007659154484e-03, - "cpu_time": 7.2029400863261807e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1470335366192247e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8616939485073090e+08, - "cpu_time": 4.5253928500000030e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7521197001519871e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8567315638065338e+08, - "cpu_time": 4.5243155349999142e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7586374498878779e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8522068262100220e+08, - "cpu_time": 4.5172099050000727e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7646001479730530e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8617884218692780e+08, - "cpu_time": 4.5270892549996233e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7519958351730547e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8556868433952332e+08, - "cpu_time": 4.5217475999999124e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7600125044642081e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8576215207576758e+08, - "cpu_time": 4.5231510289999044e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7574731275300364e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time_median", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8567315638065338e+08, - "cpu_time": 4.5243155349999142e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7586374498878779e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1170878530419740e+05, - "cpu_time": 3.8457127745416330e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4142963165013418e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4407393782331121e-03, - "cpu_time": 8.5022869010676000e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4409407952467282e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 91783, - "real_time": 7.5923980512014004e+03, - "cpu_time": 1.4786970615474365e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3717937109407909e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 91783, - "real_time": 7.6584969569509794e+03, - "cpu_time": 1.4824515411351462e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3426924556998111e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 91783, - "real_time": 7.5879229917254970e+03, - "cpu_time": 1.4767249163788101e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3737822626714021e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 91783, - "real_time": 7.5960768989545204e+03, - "cpu_time": 1.4721806293103673e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3701607211906232e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 91783, - "real_time": 7.5379840775250505e+03, - "cpu_time": 1.4655962574768371e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3961334670801342e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5945757952714903e+03, - "cpu_time": 1.4751300811697194e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3709125235165529e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time_median", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5923980512013995e+03, - "cpu_time": 1.4767249163788099e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.3717937109407909e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2836296246402732e+01, - "cpu_time": 6.4896780517512781e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8987135925574714e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.6403803716164533e-03, - "cpu_time": 4.3993937447233270e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6326397653793875e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 82564, - "real_time": 8.5243028405770074e+03, - "cpu_time": 1.5680613027470783e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.0063562918342173e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 82564, - "real_time": 8.5333426629340374e+03, - "cpu_time": 1.5682481154014013e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 5.9999934401316769e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 82564, - "real_time": 8.5090498630299353e+03, - "cpu_time": 1.5671417203624424e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.0171230424272671e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 82564, - "real_time": 8.4929010304256772e+03, - "cpu_time": 1.5650012426722426e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.0285643052446805e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 82564, - "real_time": 8.5640414032171648e+03, - "cpu_time": 1.5729501538199478e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 5.9784858093710549e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5247275600367648e+03, - "cpu_time": 1.5682805070006225e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.0061045778017797e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time_median", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5243028405770056e+03, - "cpu_time": 1.5680613027470783e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.0063562918342173e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6826744214569420e+01, - "cpu_time": 2.9114047588309035e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8881549543800688e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1469327348748401e-03, - "cpu_time": 1.8564311332282270e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1437264035637708e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 75948, - "real_time": 9.1239547725872835e+03, - "cpu_time": 1.6229336848896557e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1223203375323439e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 75948, - "real_time": 9.2018511671705219e+03, - "cpu_time": 1.6321887054299686e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1128195635823023e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 75948, - "real_time": 9.1047662517047211e+03, - "cpu_time": 1.6223212882498357e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1246856555029872e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 75948, - "real_time": 9.2213314853955744e+03, - "cpu_time": 1.6365415521146744e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1104687014253590e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 75948, - "real_time": 9.1170019919724782e+03, - "cpu_time": 1.6219230196976803e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1231762380897054e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1537811337661169e+03, - "cpu_time": 1.6271816500763631e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1186940992265397e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time_median", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1239547725872853e+03, - "cpu_time": 1.6229336848896559e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1223203375323439e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3662262979755198e+01, - "cpu_time": 6.7453667108504703e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5441817226067313e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.8623056631546397e-03, - "cpu_time": 4.1454294365560924e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8498402084460359e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 72236, - "real_time": 9.6744130111051436e+03, - "cpu_time": 1.6824468076857975e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1169243008843276e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 72236, - "real_time": 9.6861891293785757e+03, - "cpu_time": 1.6841550764162268e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1143506209148228e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 72236, - "real_time": 9.6687236179641059e+03, - "cpu_time": 1.6822142851209464e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1181699683657283e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 72236, - "real_time": 9.6941251841420562e+03, - "cpu_time": 1.6869614624286507e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1126197166817904e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 72236, - "real_time": 9.6829637312608502e+03, - "cpu_time": 1.6839298479981593e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1150549117396346e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6812829347701481e+03, - "cpu_time": 1.6839414959299564e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1154239037172607e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time_median", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6829637312608502e+03, - "cpu_time": 1.6839298479981597e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1150549117396346e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.9593107328214874e+00, - "cpu_time": 1.8962660729620438e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1762133797033783e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0287180738260222e-03, - "cpu_time": 1.1260878584827742e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0287363094835496e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 68493, - "real_time": 1.0208763676736826e+04, - "cpu_time": 1.7477120245864146e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0122390229619497e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 68493, - "real_time": 1.0215654381183149e+04, - "cpu_time": 1.7493793803746958e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0095326712938505e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 68493, - "real_time": 1.0209085721702661e+04, - "cpu_time": 1.7478938592263916e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0121124571347743e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 68493, - "real_time": 1.0216581703032745e+04, - "cpu_time": 1.7521363058997777e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0091687406406403e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 68493, - "real_time": 1.0211136029019282e+04, - "cpu_time": 1.7478622924969834e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0113068598434836e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0212244302334931e+04, - "cpu_time": 1.7489967725168524e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0108719503749394e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time_median", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0211136029019282e+04, - "cpu_time": 1.7478938592263912e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0113068598434836e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6661061923381135e+00, - "cpu_time": 1.8812959975942682e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4397467318941897e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.5899123481602304e-04, - "cpu_time": 1.0756429212199368e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5896103134372095e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 62335, - "real_time": 1.1223134919809392e+04, - "cpu_time": 1.8658727183766001e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2992083393212271e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 62335, - "real_time": 1.1232821867586819e+04, - "cpu_time": 1.8673726830834181e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2929136565751600e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 62335, - "real_time": 1.1225026283266045e+04, - "cpu_time": 1.8661425924440005e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2979784574869144e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 62335, - "real_time": 1.1233271036562493e+04, - "cpu_time": 1.8660965444773887e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2926220451161158e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 62335, - "real_time": 1.1229423278144441e+04, - "cpu_time": 1.8682438774364105e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2951208598075509e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1228735477073838e+04, - "cpu_time": 1.8667456831635638e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2955686716613948e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time_median", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1229423278144441e+04, - "cpu_time": 1.8661425924440009e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2951208598075509e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5515743952775605e+00, - "cpu_time": 1.0228492004306862e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9574692275660281e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.0535057616867843e-04, - "cpu_time": 5.4793173470596673e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0537884854047076e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 62072, - "real_time": 1.1247184257777682e+04, - "cpu_time": 1.9096152017013759e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4567201554175742e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 62072, - "real_time": 1.1262147826598448e+04, - "cpu_time": 1.9143199590798682e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4547846691645253e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 62072, - "real_time": 1.1246764502690383e+04, - "cpu_time": 1.9100091619409952e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4567745235601509e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 62072, - "real_time": 1.1257229778878465e+04, - "cpu_time": 1.9162205148859357e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4554202340917575e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 62072, - "real_time": 1.1288810652778753e+04, - "cpu_time": 1.9433319709368508e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4513486410516648e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1260427403744749e+04, - "cpu_time": 1.9186993617090055e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4550096446571348e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time_median", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1257229778878467e+04, - "cpu_time": 1.9143199590798682e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4554202340917575e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7181743694819026e+01, - "cpu_time": 1.4054632878358422e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2171372113786736e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5258518241594540e-03, - "cpu_time": 7.3250834178835685e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5237955428818687e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 61562, - "real_time": 1.1369005053107738e+04, - "cpu_time": 1.9774632240668143e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8822223094221258e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 61562, - "real_time": 1.1377600759334075e+04, - "cpu_time": 1.9794923215620282e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8800448084907045e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 61562, - "real_time": 1.1370734886516437e+04, - "cpu_time": 1.9761566420844516e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8817838360523834e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 61562, - "real_time": 1.1379389022687845e+04, - "cpu_time": 1.9804226747019682e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8795922113804407e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 61562, - "real_time": 1.1366646229609305e+04, - "cpu_time": 1.9758022855007897e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8828204325249157e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1372675190251080e+04, - "cpu_time": 1.9778674295832105e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8812927195741138e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time_median", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1370734886516437e+04, - "cpu_time": 1.9774632240668147e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.8817838360523834e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5434607521911818e+00, - "cpu_time": 2.0325198403427230e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4043014044570345e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.8743683077691021e-04, - "cpu_time": 1.0276319888492369e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8738588582718017e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 53687, - "real_time": 1.2973473578859910e+04, - "cpu_time": 2.3630541080708277e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.0515384026981001e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 53687, - "real_time": 1.2963155936503001e+04, - "cpu_time": 2.3508846368765833e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.0555590259820080e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 53687, - "real_time": 1.2968184359236460e+04, - "cpu_time": 2.3587246428373910e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.0535987293643484e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 53687, - "real_time": 1.2962918396991905e+04, - "cpu_time": 2.3587174772290877e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.0556516667734232e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 53687, - "real_time": 1.2967700417812075e+04, - "cpu_time": 2.3585706875034135e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.0537873245422573e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2967086537880670e+04, - "cpu_time": 2.3579903105034606e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.0540270298720274e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time_median", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2967700417812073e+04, - "cpu_time": 2.3587174772290877e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.0537873245422573e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3358787621626611e+00, - "cpu_time": 4.4027689120561533e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6897205638803120e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.3437570957024814e-04, - "cpu_time": 1.8671700610661571e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3433152491926766e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 42944, - "real_time": 1.6294955778623149e+04, - "cpu_time": 3.0069813175298346e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.0437162138205557e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 42944, - "real_time": 1.6301689182704848e+04, - "cpu_time": 3.0092493340162917e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.0403937610993004e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 42944, - "real_time": 1.6298726765312149e+04, - "cpu_time": 3.0073880053092304e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.0418551637392111e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 42944, - "real_time": 1.6302179006003180e+04, - "cpu_time": 3.0092999813709248e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.0401521754689064e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 42944, - "real_time": 1.6299976856715286e+04, - "cpu_time": 3.0079511410206327e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.0412384110840492e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6299505517871725e+04, - "cpu_time": 3.0081739558493828e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.0414711450424042e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time_median", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6299976856715288e+04, - "cpu_time": 3.0079511410206331e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.0412384110840492e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8915685180226349e+00, - "cpu_time": 1.0623232249577059e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4267450934206853e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7740222332831822e-04, - "cpu_time": 3.5314554296038045e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7742339277064729e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 30062, - "real_time": 2.3288759653339177e+04, - "cpu_time": 4.4717244228594172e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1256245669674959e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 30062, - "real_time": 2.3287221232976557e+04, - "cpu_time": 4.4725253742265653e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1256989289421240e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 30062, - "real_time": 2.3286649847574150e+04, - "cpu_time": 4.4711716585725379e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1257265502590466e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 30062, - "real_time": 2.3293258492570352e+04, - "cpu_time": 4.4959774133458297e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1254071648396200e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 30062, - "real_time": 2.3290073775039375e+04, - "cpu_time": 4.4952200219546852e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1255610546023563e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3289192600299924e+04, - "cpu_time": 4.4813237781918069e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1256036531221287e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time_median", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3288759653339177e+04, - "cpu_time": 4.4725253742265646e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1256245669674959e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6385257307126908e+00, - "cpu_time": 1.3042811064521840e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2751554320944564e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1329399760637091e-04, - "cpu_time": 2.9104817482713901e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1328636226059771e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 18985, - "real_time": 3.6873701609222742e+04, - "cpu_time": 7.0968545325261875e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4218480302201788e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 18985, - "real_time": 3.6868881158148877e+04, - "cpu_time": 7.0912487542793271e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4220339308672518e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 18985, - "real_time": 3.6870803435873975e+04, - "cpu_time": 7.0912357176716177e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4219597924190784e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 18985, - "real_time": 3.6871383929861724e+04, - "cpu_time": 7.0957961285228463e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4219374054343128e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 18985, - "real_time": 3.6872826450640678e+04, - "cpu_time": 7.0893910192259951e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4218817770908646e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6871519316749604e+04, - "cpu_time": 7.0929052304451965e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4219321872063374e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time_median", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6871383929861724e+04, - "cpu_time": 7.0912487542793286e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4219374054343128e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8682675789805885e+00, - "cpu_time": 3.2340046843080103e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2049683835531154e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.0669666279032108e-05, - "cpu_time": 4.5594923084923598e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0670267178554266e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10837, - "real_time": 6.4523350905901680e+04, - "cpu_time": 1.2367614395127280e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6251108866450569e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10837, - "real_time": 6.4507258530728126e+04, - "cpu_time": 1.2359432776598584e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6255162967443567e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10837, - "real_time": 6.4518034257524712e+04, - "cpu_time": 1.2372912245086118e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6252448049092646e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10837, - "real_time": 6.4507214654091971e+04, - "cpu_time": 1.2362346691888115e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6255174023910275e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10837, - "real_time": 6.4502063084752233e+04, - "cpu_time": 1.2368965368645072e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6256472271626841e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4511584286599747e+04, - "cpu_time": 1.2366254295469033e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6254073235704781e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time_median", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4507258530728126e+04, - "cpu_time": 1.2367614395127280e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.6255162967443567e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7822917633408224e+00, - "cpu_time": 5.3696035086361874e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2126533689667708e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3613511217341269e-04, - "cpu_time": 4.3421422367188395e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3612916201868151e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6575, - "real_time": 1.0643200717331706e+05, - "cpu_time": 2.1790994479087144e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9704147800059196e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6575, - "real_time": 1.0654270342757444e+05, - "cpu_time": 2.1807829566539731e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9683675489101902e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6575, - "real_time": 1.0645414954679929e+05, - "cpu_time": 2.1796624045627739e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9700049353905659e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6575, - "real_time": 1.0638523559588868e+05, - "cpu_time": 2.1797718737642313e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9712810600581551e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6575, - "real_time": 1.0656441413924034e+05, - "cpu_time": 2.1808647528517214e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9679665270432552e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0647570197656397e+05, - "cpu_time": 2.1800362871482829e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9696069702816174e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time_median", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0645414954679928e+05, - "cpu_time": 2.1797718737642313e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9700049353905659e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5691728956130220e+01, - "cpu_time": 7.6342012783483426e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4000650616927773e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.1088264788139656e-04, - "cpu_time": 3.5018689016111203e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1083474155891814e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3450, - "real_time": 2.0319172511876060e+05, - "cpu_time": 4.1600277536229871e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0642100447488850e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3450, - "real_time": 2.0330233220179714e+05, - "cpu_time": 4.1604464550725120e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0630870067131100e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3450, - "real_time": 2.0315827779046705e+05, - "cpu_time": 4.1587395130433002e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0645498896805534e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3450, - "real_time": 2.0335579425538552e+05, - "cpu_time": 4.1617368434779806e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0625446230130821e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3450, - "real_time": 2.0328221395544277e+05, - "cpu_time": 4.1619001681158191e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0632911844020676e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0325806866437063e+05, - "cpu_time": 4.1605701466665207e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0635365497115398e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time_median", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0328221395544274e+05, - "cpu_time": 4.1604464550725126e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0632911844020676e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.1320710035706171e+01, - "cpu_time": 1.3029627537495247e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2563083006002139e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.0008601168983255e-04, - "cpu_time": 3.1316927916561345e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0010477651846566e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1758, - "real_time": 3.9843334119758476e+05, - "cpu_time": 7.8810194766782736e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1053981011694637e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1758, - "real_time": 3.9865742719971150e+05, - "cpu_time": 7.8816324573379464e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1042146533990551e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1758, - "real_time": 3.9851444176929572e+05, - "cpu_time": 7.8852415585888969e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1049696374256508e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1758, - "real_time": 3.9834716356363660e+05, - "cpu_time": 7.8788444084185991e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1058535788117661e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1758, - "real_time": 3.9849624050192040e+05, - "cpu_time": 7.8807651934014168e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1050657816581272e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9848972284642980e+05, - "cpu_time": 7.8815006188850279e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1051003504928127e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time_median", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9849624050192034e+05, - "cpu_time": 7.8810194766782748e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.1050657816581272e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1432442255181756e+02, - "cpu_time": 2.3366543220923387e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0389332962171389e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8689428107503786e-04, - "cpu_time": 2.9647327775289805e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8687151635328924e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 888, - "real_time": 7.8820547623599693e+05, - "cpu_time": 1.6424407364865032e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1285332956728569e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 888, - "real_time": 7.8858043825430039e+05, - "cpu_time": 1.6427606497747879e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1275211996305828e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 888, - "real_time": 7.8816224138151750e+05, - "cpu_time": 1.6423926283783836e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1286500569466923e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 888, - "real_time": 7.8842152412959829e+05, - "cpu_time": 1.6425930608107564e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1279500224859684e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 888, - "real_time": 7.8826909078555682e+05, - "cpu_time": 1.6430012916666905e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1283615197039516e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8832775415739394e+05, - "cpu_time": 1.6426376734234241e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1282032188880104e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time_median", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8826909078555682e+05, - "cpu_time": 1.6425930608107564e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1283615197039516e+10, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7206817003619375e+02, - "cpu_time": 2.4907976792231926e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6447087257997133e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1826983653532438e-04, - "cpu_time": 1.5163402858234197e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1824554556526708e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 75, - "real_time": 9.2386158431569729e+06, - "cpu_time": 1.7337691506666791e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6319761065564499e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 75, - "real_time": 9.2473860209186878e+06, - "cpu_time": 1.7337267080000252e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6285315573607378e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 75, - "real_time": 9.2384388421972599e+06, - "cpu_time": 1.7340170253334388e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6320456922589159e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 75, - "real_time": 9.2299758767088261e+06, - "cpu_time": 1.7333297093333993e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6353759151930370e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 75, - "real_time": 9.2267630249261856e+06, - "cpu_time": 1.7323669146667272e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6366417896885824e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2362359215815868e+06, - "cpu_time": 1.7334419016000539e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6329142122115450e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time_median", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2384388421972580e+06, - "cpu_time": 1.7337267080000248e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6320456922589159e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.1204300056742095e+03, - "cpu_time": 6.4945322368503530e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1936205189721584e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7919257093680748e-04, - "cpu_time": 3.7466108502716894e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7907953021220243e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 37, - "real_time": 1.8606612207116306e+07, - "cpu_time": 3.4680258432432756e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6067212694599752e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 37, - "real_time": 1.8667667600754146e+07, - "cpu_time": 3.4752377324323520e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5949249491290975e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 37, - "real_time": 1.8621410268384058e+07, - "cpu_time": 3.4668845594594769e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6038550804038339e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 37, - "real_time": 1.8614270799868815e+07, - "cpu_time": 3.4697742513513558e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6052373322339840e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 37, - "real_time": 1.8664117751492035e+07, - "cpu_time": 3.4759535891892582e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5956086911547275e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8634815725523073e+07, - "cpu_time": 3.4711751951351449e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6012694644763241e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time_median", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8621410268384058e+07, - "cpu_time": 3.4697742513513565e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6038550804038339e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8875132613586797e+04, - "cpu_time": 4.1721659346541899e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5778309274053834e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5495260612659633e-03, - "cpu_time": 1.2019462286148753e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5488513099134278e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19, - "real_time": 3.7261665651672766e+07, - "cpu_time": 6.8825946736847311e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6020324280370607e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19, - "real_time": 3.7337673926039748e+07, - "cpu_time": 6.8817045947370335e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5946997733673744e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19, - "real_time": 3.7390322473488353e+07, - "cpu_time": 6.8865885263155743e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5896381502236900e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19, - "real_time": 3.7298886203452162e+07, - "cpu_time": 6.8871071578948766e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5984379605302429e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19, - "real_time": 3.7385581159277968e+07, - "cpu_time": 6.8931284157895923e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5900933953166924e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7334825882786199e+07, - "cpu_time": 6.8862246736843616e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5949803414950123e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time_median", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7337673926039740e+07, - "cpu_time": 6.8865885263155743e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5946997733673744e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5471075768795949e+04, - "cpu_time": 4.5326823143537229e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3429164084645752e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4857729869411753e-03, - "cpu_time": 6.5822457574980417e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4862157511110795e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.4127174086040914e+07, - "cpu_time": 1.3444352444443870e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6212827388836040e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.4312290383709803e+07, - "cpu_time": 1.3474003533332911e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6122619100277991e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.4273020856910288e+07, - "cpu_time": 1.3463885966666567e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6141717800485163e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.4104344679249659e+07, - "cpu_time": 1.3446170922222537e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6223983514311543e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.4213022987047836e+07, - "cpu_time": 1.3457162077778170e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6170936743386564e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4205970598591700e+07, - "cpu_time": 1.3457114988888812e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6174416909459457e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time_median", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4213022987047836e+07, - "cpu_time": 1.3457162077778170e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6170936743386564e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9980675563218174e+04, - "cpu_time": 1.2386751256318674e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3865047487036875e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2125799964258651e-03, - "cpu_time": 9.2046112904185567e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2125986051641472e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4729973971843719e+08, - "cpu_time": 2.5913016959998459e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6447512604314604e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4730197787284851e+08, - "cpu_time": 2.5905497880000892e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6446958808891792e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4741483926773071e+08, - "cpu_time": 2.5921910459999251e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6419054870381808e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4721653461456299e+08, - "cpu_time": 2.5905152539999110e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6468112322139359e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4739173948764801e+08, - "cpu_time": 2.5921878899998775e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6424762599737949e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4732496619224548e+08, - "cpu_time": 2.5913491347999302e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6441280241093102e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time_median", - "family_index": 4, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4730197787284851e+08, - "cpu_time": 2.5913016959998459e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6446958808891792e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9777953572336351e+04, - "cpu_time": 8.2898849236959068e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9734795650322807e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.4151007554438188e-04, - "cpu_time": 3.1990613740035239e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4155055804183346e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.9853375256061554e+08, - "cpu_time": 4.6241900799998349e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.5967183435379992e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.9657407104969025e+08, - "cpu_time": 4.6094724450000513e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6204844887471542e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.9677063226699829e+08, - "cpu_time": 4.6224333050002998e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6180865195380149e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.9662142693996429e+08, - "cpu_time": 4.6227890649998927e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6199064749874716e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.9631565511226654e+08, - "cpu_time": 4.6259104050000131e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6236419017185788e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9696310758590698e+08, - "cpu_time": 4.6209590600000179e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6157675457058434e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time_median", - "family_index": 4, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9662142693996429e+08, - "cpu_time": 4.6227890649998921e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6199064749874716e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9320520891080773e+05, - "cpu_time": 6.5654388342783810e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0835537743466172e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0077985651884953e-03, - "cpu_time": 1.4207957155712944e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9967462251091529e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 97018, - "real_time": 7.2145366791511142e+03, - "cpu_time": 1.4377992321012642e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5483914128512241e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 97018, - "real_time": 7.1952725558306820e+03, - "cpu_time": 1.4307121523841915e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5578916297277808e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 97018, - "real_time": 7.2089905747271996e+03, - "cpu_time": 1.4355525799336847e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5511213025783084e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 97018, - "real_time": 7.2069935178610458e+03, - "cpu_time": 1.4329728266919368e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5521053177799709e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 97018, - "real_time": 7.1957065286691068e+03, - "cpu_time": 1.4362926343564999e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5576770533935167e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2042999712478313e+03, - "cpu_time": 1.4346658850935153e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5534373432661600e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time_median", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2069935178610449e+03, - "cpu_time": 1.4355525799336847e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5521053177799709e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5057131900412646e+00, - "cpu_time": 2.8173060476456715e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1956989875049425e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1806439520824143e-03, - "cpu_time": 1.9637366978040548e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1807437650352502e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 95384, - "real_time": 7.3598769254035751e+03, - "cpu_time": 1.4539557797953770e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9566380686715737e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 95384, - "real_time": 7.3229799188308334e+03, - "cpu_time": 1.4457065367357845e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9916892532151654e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 95384, - "real_time": 7.3494950375187582e+03, - "cpu_time": 1.4529646984818257e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9664650072728649e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 95384, - "real_time": 7.3283983569817146e+03, - "cpu_time": 1.4476282835695951e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9865197695240065e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 95384, - "real_time": 7.3507399960669318e+03, - "cpu_time": 1.4527842436887415e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9652851314826727e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3422980469603617e+03, - "cpu_time": 1.4506079084542649e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9733194460332572e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time_median", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3494950375187591e+03, - "cpu_time": 1.4527842436887415e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9664650072728649e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5799300626050371e+01, - "cpu_time": 3.6878430680896713e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5012496859699921e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1518195699766129e-03, - "cpu_time": 2.5422742055910574e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1528480052982108e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 92657, - "real_time": 7.5127615273428737e+03, - "cpu_time": 1.4685678491641302e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3630141144146898e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 92657, - "real_time": 7.5549063548937875e+03, - "cpu_time": 1.4668269164768770e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3554105794265616e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 92657, - "real_time": 7.5113514447626922e+03, - "cpu_time": 1.4682887812038414e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3632699888033950e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 92657, - "real_time": 7.5520748253881966e+03, - "cpu_time": 1.4667983606203647e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3559187689157513e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 92657, - "real_time": 7.5122611086873912e+03, - "cpu_time": 1.4654900212612038e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3631049096733573e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5286710522149897e+03, - "cpu_time": 1.4671943857452832e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3601436722467509e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time_median", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5127615273428728e+03, - "cpu_time": 1.4668269164768770e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3630141144146898e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2684773174356703e+01, - "cpu_time": 1.2530793110666085e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0937206899714103e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0131178553328719e-03, - "cpu_time": 8.5406495774592833e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0097707863531837e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 90003, - "real_time": 7.7876028618832161e+03, - "cpu_time": 1.5059769774340914e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6298208014998186e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 90003, - "real_time": 7.7761520992028200e+03, - "cpu_time": 1.4989882803906759e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6336933407076138e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 90003, - "real_time": 7.7875956039279436e+03, - "cpu_time": 1.5039887581525423e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6298232524644965e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 90003, - "real_time": 7.7724740230052439e+03, - "cpu_time": 1.4983123018121594e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6349396523401135e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 90003, - "real_time": 7.7852063519031144e+03, - "cpu_time": 1.5023454418186435e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6306303358283636e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7818061879844699e+03, - "cpu_time": 1.5019223519216224e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6317814765680814e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time_median", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7852063519031162e+03, - "cpu_time": 1.5023454418186437e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6306303358283636e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0309654918993143e+00, - "cpu_time": 3.2607616196957856e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3787240306517272e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.0351331324024840e-04, - "cpu_time": 2.1710587205282820e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0384557070203708e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 81175, - "real_time": 8.6338694556105329e+03, - "cpu_time": 1.5923093698799885e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7441069396043539e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 81175, - "real_time": 8.6208047094362064e+03, - "cpu_time": 1.5847261915613570e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7512965877960074e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 81175, - "real_time": 8.6349262151790281e+03, - "cpu_time": 1.5915573600245762e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7435263462932527e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 81175, - "real_time": 8.6219504554340638e+03, - "cpu_time": 1.5858100597475528e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7506652017681903e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 81175, - "real_time": 8.6329860749077343e+03, - "cpu_time": 1.5911632719433961e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7445923860635632e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6289073821135134e+03, - "cpu_time": 1.5891132506313743e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7468374923050737e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time_median", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6329860749077361e+03, - "cpu_time": 1.5911632719433959e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7445923860635632e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9198336882069187e+00, - "cpu_time": 3.5548837411532155e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8077224273835926e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.0193625702261451e-04, - "cpu_time": 2.2370235348178088e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0215984506656348e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 65618, - "real_time": 1.0676522894001089e+04, - "cpu_time": 1.8177006492121309e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6729100675678885e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 65618, - "real_time": 1.0670416829326472e+04, - "cpu_time": 1.8117103995854552e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6773008318524039e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 65618, - "real_time": 1.0676091654852553e+04, - "cpu_time": 1.8210781630038840e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6732199992649269e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 65618, - "real_time": 1.0669074271205927e+04, - "cpu_time": 1.8147692157639362e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6782669159112108e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 65618, - "real_time": 1.0676023244462389e+04, - "cpu_time": 1.8209741397176789e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6732691681325793e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0673625778769685e+04, - "cpu_time": 1.8172465134566170e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6749933965458012e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time_median", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0676023244462389e+04, - "cpu_time": 1.8177006492121305e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6732691681325793e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5789398188896122e+00, - "cpu_time": 4.0487200363975049e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5738273011218139e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.3530684821349852e-04, - "cpu_time": 2.2279421126506177e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3535237988350423e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 65679, - "real_time": 1.0660178189750946e+04, - "cpu_time": 1.8535354572998836e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5369349093762922e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 65679, - "real_time": 1.0655615225835336e+04, - "cpu_time": 1.8486369143865635e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5375930580034239e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 65679, - "real_time": 1.0663420382688360e+04, - "cpu_time": 1.8548009287595039e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5364676072040424e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 65679, - "real_time": 1.0657330279667714e+04, - "cpu_time": 1.8490374899130595e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5373456175284114e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 65679, - "real_time": 1.0669393446720214e+04, - "cpu_time": 1.8547911813515751e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5356074440235832e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0661187504932515e+04, - "cpu_time": 1.8521603943421174e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5367897272271507e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time_median", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0660178189750946e+04, - "cpu_time": 1.8535354572998833e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5369349093762922e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4605499263941457e+00, - "cpu_time": 3.0802476971348455e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8692234371632885e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.1218965278190267e-04, - "cpu_time": 1.6630566696838054e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1205596300814868e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 65106, - "real_time": 1.0742469683062278e+04, - "cpu_time": 1.9353042407766305e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0503227811445928e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 65106, - "real_time": 1.0749193568507919e+04, - "cpu_time": 1.9302959066753072e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0484147290826473e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 65106, - "real_time": 1.0743546262429025e+04, - "cpu_time": 1.9369520950450435e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0500171172150216e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 65106, - "real_time": 1.0748443778762436e+04, - "cpu_time": 1.9299814441063652e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0486273803418331e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 65106, - "real_time": 1.0740742514654659e+04, - "cpu_time": 1.9348023315822444e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0508132892387443e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0744879161483264e+04, - "cpu_time": 1.9334672036371187e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0496390594045677e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time_median", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0743546262429027e+04, - "cpu_time": 1.9348023315822444e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0500171172150216e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7421470233312051e+00, - "cpu_time": 3.1428245308455423e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0620379105851166e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.4827260196145605e-04, - "cpu_time": 1.6254863412906388e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4825036337004291e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 55795, - "real_time": 1.2549369167846811e+04, - "cpu_time": 2.2698727574153650e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2222545311609879e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 55795, - "real_time": 1.2534709495565552e+04, - "cpu_time": 2.2642396272066195e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2283620951235371e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 55795, - "real_time": 1.2553059914788299e+04, - "cpu_time": 2.2674191898914803e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2207191270388546e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 55795, - "real_time": 1.2545810182864210e+04, - "cpu_time": 2.2647599874540341e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2237359759764938e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 55795, - "real_time": 1.2540127161509992e+04, - "cpu_time": 2.2662114418856359e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2261033046899843e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2544615184514971e+04, - "cpu_time": 2.2665006007706270e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2242350067979717e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time_median", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2545810182864208e+04, - "cpu_time": 2.2662114418856359e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2237359759764938e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3076479117181874e+00, - "cpu_time": 2.2605638371798808e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0436869515769850e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.8253264880844834e-04, - "cpu_time": 9.9738064768713154e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8260911839081223e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 46496, - "real_time": 1.5064143676076252e+04, - "cpu_time": 2.8215804370268692e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7009260412298622e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 46496, - "real_time": 1.5059443572256458e+04, - "cpu_time": 2.8217820350136863e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7036416299915524e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 46496, - "real_time": 1.5064087967569696e+04, - "cpu_time": 2.8231086609600770e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7009582181260967e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 46496, - "real_time": 1.5062848533263037e+04, - "cpu_time": 2.8233070285616599e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7016741694345455e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 46496, - "real_time": 1.5068020716199471e+04, - "cpu_time": 2.8253374612871838e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6986872707897110e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5063708893072984e+04, - "cpu_time": 2.8230231245698953e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7011774659143543e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time_median", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5064087967569698e+04, - "cpu_time": 2.8231086609600763e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7009582181260967e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0764318956120671e+00, - "cpu_time": 1.5054669555125907e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7770181960576542e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0422805017340437e-04, - "cpu_time": 5.3328183620244261e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0422732475218147e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 33059, - "real_time": 2.1176531446141784e+04, - "cpu_time": 4.2650729513901118e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2378986646926109e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 33059, - "real_time": 2.1174944018122460e+04, - "cpu_time": 4.2657680782842144e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2379914665920509e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 33059, - "real_time": 2.1176994922760037e+04, - "cpu_time": 4.2663657400403237e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2378715722232145e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 33059, - "real_time": 2.1176603552820736e+04, - "cpu_time": 4.2665284461114359e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2378944496275574e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 33059, - "real_time": 2.1175699301379715e+04, - "cpu_time": 4.2637030702680931e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2379473105897375e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1176154648244948e+04, - "cpu_time": 4.2654876572188354e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2379206927450344e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time_median", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1176531446141784e+04, - "cpu_time": 4.2657680782842144e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.2378986646926109e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2500282764971655e-01, - "cpu_time": 1.1499606997247110e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8229161767544749e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8959048106408299e-05, - "cpu_time": 2.6959653670044926e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8959815479454272e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19288, - "real_time": 3.6289626697514730e+04, - "cpu_time": 6.9583070458320639e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4447324144998863e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19288, - "real_time": 3.6293947589902440e+04, - "cpu_time": 6.9628477602658735e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4445604152078112e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19288, - "real_time": 3.6292081974089255e+04, - "cpu_time": 6.9605354572793411e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4446346736853388e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19288, - "real_time": 3.6292099104352179e+04, - "cpu_time": 6.9617923786807543e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4446339918021631e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19288, - "real_time": 3.6290413370822920e+04, - "cpu_time": 6.9640104002485590e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4447010967957771e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6291633747336309e+04, - "cpu_time": 6.9614986084613178e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4446525183981953e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time_median", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6292081974089262e+04, - "cpu_time": 6.9617923786807543e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4446346736853388e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6799478611697036e+00, - "cpu_time": 2.1982573609718955e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6872852441031707e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6290224156497399e-05, - "cpu_time": 3.1577358333448991e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6289922032724602e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 12188, - "real_time": 5.7400847059415391e+04, - "cpu_time": 1.1851160067279437e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8267604986989532e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 12188, - "real_time": 5.7412725952104411e+04, - "cpu_time": 1.1850714038398454e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8263825355980423e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 12188, - "real_time": 5.7404522219153900e+04, - "cpu_time": 1.1845747710863144e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8266435456022778e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 12188, - "real_time": 5.7389702975762790e+04, - "cpu_time": 1.1850016467016531e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8271152238631413e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 12188, - "real_time": 5.7400490456303400e+04, - "cpu_time": 1.1850683705283824e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8267718475301830e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.7401657732547981e+04, - "cpu_time": 1.1849664397768278e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8267347302585197e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time_median", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.7400847059415384e+04, - "cpu_time": 1.1850683705283822e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8267604986989532e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3013055762699768e+00, - "cpu_time": 2.2272263919604274e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6418402933712704e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4461787175116647e-04, - "cpu_time": 1.8795691736045241e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4462090470012561e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6586, - "real_time": 1.0655593149164926e+05, - "cpu_time": 2.1899720376555889e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9681231918697582e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6586, - "real_time": 1.0650824078114354e+05, - "cpu_time": 2.1888982645004280e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9690044494390751e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6586, - "real_time": 1.0638733175122365e+05, - "cpu_time": 2.1888662572122249e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9712422198011173e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6586, - "real_time": 1.0655233235624783e+05, - "cpu_time": 2.1897106893408709e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9681896713329250e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6586, - "real_time": 1.0654458197327532e+05, - "cpu_time": 2.1896790479806662e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9683328435471554e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0650968367070793e+05, - "cpu_time": 2.1894252593379561e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9689784751980064e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time_median", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0654458197327532e+05, - "cpu_time": 2.1896790479806662e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9683328435471554e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0971362137923705e+01, - "cpu_time": 5.0868763024251713e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3129904441803070e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.6633717885542919e-04, - "cpu_time": 2.3233843131796852e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6683839397902443e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3423, - "real_time": 2.0470107062159284e+05, - "cpu_time": 4.2023295851592027e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0489897718969551e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3423, - "real_time": 2.0427234413571877e+05, - "cpu_time": 4.1979051329243887e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0532901885207230e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3423, - "real_time": 2.0481956521782529e+05, - "cpu_time": 4.2018020420682686e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0478043665112579e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3423, - "real_time": 2.0447885633343295e+05, - "cpu_time": 4.2022895763949404e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0512164803780830e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3423, - "real_time": 2.0466244320242724e+05, - "cpu_time": 4.2009796085302765e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0493764925162666e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0458685590219946e+05, - "cpu_time": 4.2010611890154163e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0501354599646572e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time_median", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0466244320242727e+05, - "cpu_time": 4.2018020420682692e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0493764925162666e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1418077978838141e+02, - "cpu_time": 1.8462105099018041e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1472975353108380e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0468941362037855e-03, - "cpu_time": 4.3946289445369693e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0473930026788844e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1743, - "real_time": 4.0191819692833099e+05, - "cpu_time": 7.9615857142854470e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0871431211898659e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1743, - "real_time": 4.0172644389517570e+05, - "cpu_time": 7.9584139013193292e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0881393613682243e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1743, - "real_time": 4.0197969130168244e+05, - "cpu_time": 7.9609844750429934e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0868238325265091e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1743, - "real_time": 4.0169751093075279e+05, - "cpu_time": 7.9584959265632008e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0882897632507565e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1743, - "real_time": 4.0189973294400470e+05, - "cpu_time": 7.9601512392425805e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0872390082351101e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0184431519998936e+05, - "cpu_time": 7.9599262512907118e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0875270173140934e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time_median", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0189973294400470e+05, - "cpu_time": 7.9601512392425805e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0872390082351101e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2480130500835472e+02, - "cpu_time": 1.4367764000408982e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4837121187665323e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1057128417069619e-04, - "cpu_time": 1.8050122007197281e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1059296789886674e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 879, - "real_time": 7.9631332096943597e+05, - "cpu_time": 1.6578530807736756e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1068611510322762e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 879, - "real_time": 7.9643015434014041e+05, - "cpu_time": 1.6578912980660668e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1065520822601559e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 879, - "real_time": 7.9624032968839584e+05, - "cpu_time": 1.6575035631399802e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1070542868088165e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 879, - "real_time": 7.9641123559215746e+05, - "cpu_time": 1.6575741285552392e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1066021234024403e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 879, - "real_time": 7.9614640133025229e+05, - "cpu_time": 1.6573266882822446e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1073028744421322e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9630828838407644e+05, - "cpu_time": 1.6576297517634411e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1068745035891644e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time_median", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9631332096943597e+05, - "cpu_time": 1.6575741285552392e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1068611510322762e+10, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1863870356795164e+02, - "cpu_time": 2.3934666362859315e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1390618195887762e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4898589566196964e-04, - "cpu_time": 1.4439090718175652e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4899140002127463e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 78, - "real_time": 8.6040661479227059e+06, - "cpu_time": 1.6717688576923486e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.8998342670925541e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 78, - "real_time": 8.6076231076358221e+06, - "cpu_time": 1.6720215641026488e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.8982227242540236e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 78, - "real_time": 8.6017523366862386e+06, - "cpu_time": 1.6725373576923046e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.9008832952433734e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 78, - "real_time": 8.6005133672211412e+06, - "cpu_time": 1.6719553435896510e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.9014452471970944e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 78, - "real_time": 8.6053564475897029e+06, - "cpu_time": 1.6731167538460879e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.8992495202680826e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6038622814111225e+06, - "cpu_time": 1.6722799753846083e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.8999270108110256e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time_median", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6040661479227059e+06, - "cpu_time": 1.6720215641026488e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.8998342670925541e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8321811793262787e+03, - "cpu_time": 5.4768771508913142e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2837162024061237e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2917555938166086e-04, - "cpu_time": 3.2750958161964987e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2916416098237777e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 39, - "real_time": 1.7630484910347521e+07, - "cpu_time": 3.3794264230769277e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.8064105633653378e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 39, - "real_time": 1.7635141762021262e+07, - "cpu_time": 3.3766230307693295e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.8054054175240316e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 39, - "real_time": 1.7616540480118532e+07, - "cpu_time": 3.3775696205126248e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.8094235400949998e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 39, - "real_time": 1.7600597574924812e+07, - "cpu_time": 3.3777680179489322e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.8128741773863711e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 39, - "real_time": 1.7635092282524474e+07, - "cpu_time": 3.3808890051283509e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.8054160945050254e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7623571401987322e+07, - "cpu_time": 3.3784552194872335e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.8079059585751534e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time_median", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7630484910347521e+07, - "cpu_time": 3.3777680179489315e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.8064105633653378e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4930096361663362e+04, - "cpu_time": 1.6941071364359137e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2277928716694321e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.4716633315196088e-04, - "cpu_time": 5.0144430705020197e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4765561617945295e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 20, - "real_time": 3.5668646544218063e+07, - "cpu_time": 6.7381422900001556e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7629049880996079e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 20, - "real_time": 3.5645565949380398e+07, - "cpu_time": 6.7393833899996027e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7653414786736755e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 20, - "real_time": 3.5706894844770432e+07, - "cpu_time": 6.7465614550002322e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7588742617774081e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 20, - "real_time": 3.5678669810295105e+07, - "cpu_time": 6.7400685149999619e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7618478691509790e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 20, - "real_time": 3.5677126981317997e+07, - "cpu_time": 6.7388046500002474e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7620105472697363e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5675380825996399e+07, - "cpu_time": 6.7405920600000411e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7621958289942818e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time_median", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5677126981317997e+07, - "cpu_time": 6.7393833899996027e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.7620105472697363e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2029964103771170e+04, - "cpu_time": 3.4119227265582020e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3230493251414187e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.1751167314009700e-04, - "cpu_time": 5.0617552526360441e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1747166567946074e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.1255274944835246e+07, - "cpu_time": 1.3179080155555312e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7672362671790781e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.1122508909967214e+07, - "cpu_time": 1.3168419144444163e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7742686543834939e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.1181426445643112e+07, - "cpu_time": 1.3170525255556086e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7711446567453618e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.1193104816807643e+07, - "cpu_time": 1.3171157877777913e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7705260458963203e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.1269569297631577e+07, - "cpu_time": 1.3184899222222964e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7664806823649573e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1204376882976964e+07, - "cpu_time": 1.3174816331111288e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7699312613138423e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time_median", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1193104816807643e+07, - "cpu_time": 1.3171157877777913e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7705260458963203e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9575185022323043e+04, - "cpu_time": 6.9384165947964255e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1547014238941851e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.3667869350550919e-04, - "cpu_time": 5.2664237742820763e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.3680608616581347e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4194575250148773e+08, - "cpu_time": 2.5409130259999985e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7822259739288292e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4159298539161682e+08, - "cpu_time": 2.5379205120000276e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7916490743882999e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4171404242515564e+08, - "cpu_time": 2.5399366939998347e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7884101166865034e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4176533520221710e+08, - "cpu_time": 2.5397650540000996e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7870394143546858e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4176908135414124e+08, - "cpu_time": 2.5393175339997926e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7869393444039369e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4175743937492371e+08, - "cpu_time": 2.5395705639999503e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7872527847524514e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time_median", - "family_index": 5, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4176533520221710e+08, - "cpu_time": 2.5397650540000996e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7870394143546858e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2707096567816280e+05, - "cpu_time": 1.0909603041678030e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3940896642487217e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.9639715727428079e-04, - "cpu_time": 4.2958456033191921e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9618777967855447e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8591477870941162e+08, - "cpu_time": 4.5039911899999654e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7554610812590885e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8626070916652679e+08, - "cpu_time": 4.5071809199998826e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7509228113292027e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8615358471870422e+08, - "cpu_time": 4.5095130650003058e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7523270066859856e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8625221550464630e+08, - "cpu_time": 4.5045546900001907e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7510341085292721e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8649133443832397e+08, - "cpu_time": 4.5124801899999058e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7479033217709970e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8621452450752258e+08, - "cpu_time": 4.5075440110000497e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7515296659149094e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time_median", - "family_index": 5, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8625221550464630e+08, - "cpu_time": 4.5071809199998826e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7510341085292721e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0840979650171023e+05, - "cpu_time": 3.5331801873491157e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7320322279797508e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.2815940022719766e-04, - "cpu_time": 7.8383709149081363e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2824486843381332e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 94525, - "real_time": 7.3973666712532731e+03, - "cpu_time": 1.4452307103940706e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.4606909644594930e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 94525, - "real_time": 7.4405699555101728e+03, - "cpu_time": 1.4485338640570266e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.4405966415303603e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 94525, - "real_time": 7.4419781148898728e+03, - "cpu_time": 1.4495723618090260e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.4399456172519036e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 94525, - "real_time": 7.4388395471525346e+03, - "cpu_time": 1.4476353906374272e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.4413969864156112e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 94525, - "real_time": 7.4555792819587559e+03, - "cpu_time": 1.4499327215023306e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.4336701457856782e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4348667141529222e+03, - "cpu_time": 1.4481810096799763e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.4432600710886084e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time_median", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4405699555101719e+03, - "cpu_time": 1.4485338640570268e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.4405966415303603e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1989463766900595e+01, - "cpu_time": 1.8795496324933193e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0214612777780663e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9576137155279082e-03, - "cpu_time": 1.2978692718175256e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9665527920902149e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 88725, - "real_time": 7.9025547221984152e+03, - "cpu_time": 1.4959866644124315e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4789174893251047e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 88725, - "real_time": 7.9741319525012532e+03, - "cpu_time": 1.5016070566356962e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4207615706609979e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 88725, - "real_time": 7.8906961425878226e+03, - "cpu_time": 1.4971727833192834e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4886543689931661e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 88725, - "real_time": 7.9129975636537956e+03, - "cpu_time": 1.4941365116934096e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4703672139586255e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 88725, - "real_time": 7.9157440418337392e+03, - "cpu_time": 1.4968986148210135e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4681222294978544e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9192248845550075e+03, - "cpu_time": 1.4971603261763670e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4653645744871497e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time_median", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9129975636537956e+03, - "cpu_time": 1.4968986148210137e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.4703672139586255e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2239204911322489e+01, - "cpu_time": 2.7551313832349088e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6211424235793637e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.0710051023047896e-03, - "cpu_time": 1.8402380393496690e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0541293431813627e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 80773, - "real_time": 8.8638724190095672e+03, - "cpu_time": 1.5940012987013662e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1552512847589245e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 80773, - "real_time": 8.7633452435345444e+03, - "cpu_time": 1.5832554690304978e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1685035469251779e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 80773, - "real_time": 8.7568052180278155e+03, - "cpu_time": 1.5822177683136095e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1693762445370717e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 80773, - "real_time": 8.6389175893148458e+03, - "cpu_time": 1.5680189271168001e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1853336826207803e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 80773, - "real_time": 8.8142091687040556e+03, - "cpu_time": 1.5891193393832686e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1617604942208984e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7674299277181653e+03, - "cpu_time": 1.5833225605091084e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1680450506125706e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time_median", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7633452435345425e+03, - "cpu_time": 1.5832554690304978e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1685035469251779e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3866622884877827e+01, - "cpu_time": 9.7860149800999537e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1225586695202170e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.5657021015627518e-03, - "cpu_time": 6.1806830927447374e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6105768260522258e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 72841, - "real_time": 9.6095911123337646e+03, - "cpu_time": 1.6793625883774188e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1312041022967386e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 72841, - "real_time": 9.6452903521370590e+03, - "cpu_time": 1.6831203539215760e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1233160695325622e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 72841, - "real_time": 9.6126374044299537e+03, - "cpu_time": 1.6840578341866436e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1305287132293013e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 72841, - "real_time": 9.6499711558323943e+03, - "cpu_time": 1.6965687016927066e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1222861363292250e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 72841, - "real_time": 9.6511639630719947e+03, - "cpu_time": 1.6981444543594222e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1220238386128458e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6337307975610347e+03, - "cpu_time": 1.6882507865075535e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1258717720001349e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time_median", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6452903521370572e+03, - "cpu_time": 1.6840578341866432e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1233160695325622e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0790282797152631e+01, - "cpu_time": 8.5143207344248268e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5911827893256437e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1580718035442816e-03, - "cpu_time": 5.0432795900176722e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1596706112739861e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 68454, - "real_time": 1.0222554970884492e+04, - "cpu_time": 1.7486782788441596e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0068260935412699e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 68454, - "real_time": 1.0226290307316822e+04, - "cpu_time": 1.7468369635083494e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0053625282565540e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 68454, - "real_time": 1.0220390030058848e+04, - "cpu_time": 1.7458325678558485e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0076748421081692e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 68454, - "real_time": 1.0225908549021618e+04, - "cpu_time": 1.7447270809594651e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0055120582824808e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 68454, - "real_time": 1.0222139468999259e+04, - "cpu_time": 1.7469479329184232e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0069889600136673e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0223456665256210e+04, - "cpu_time": 1.7466045648172494e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0064728964404279e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time_median", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0222554970884492e+04, - "cpu_time": 1.7468369635083491e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.0068260935412699e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5491945464228438e+00, - "cpu_time": 1.4657016759634192e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9898331918005511e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4934761596692885e-04, - "cpu_time": 8.3917201723148968e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4934233801197236e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 62344, - "real_time": 1.1224566529809646e+04, - "cpu_time": 1.8631601148467449e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2982773795710444e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 62344, - "real_time": 1.1231352215321349e+04, - "cpu_time": 1.8613407448991944e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2938679536955595e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 62344, - "real_time": 1.1221194767719788e+04, - "cpu_time": 1.8593192785191910e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.3004703773310065e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 62344, - "real_time": 1.1230207775135232e+04, - "cpu_time": 1.8599238387014568e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2946112521069133e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 62344, - "real_time": 1.1222367087761080e+04, - "cpu_time": 1.8605518446042945e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2997077496547532e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1225937675149418e+04, - "cpu_time": 1.8608591643141765e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2973869424718559e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time_median", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1224566529809646e+04, - "cpu_time": 1.8605518446042945e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.2982773795710444e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6009592416816432e+00, - "cpu_time": 1.4888603763814590e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9905824569805793e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.0985077370121807e-04, - "cpu_time": 8.0009299195416624e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0981552445505572e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 62469, - "real_time": 1.1206343514815397e+04, - "cpu_time": 1.8849134386655434e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4620290711541600e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 62469, - "real_time": 1.1210484394138257e+04, - "cpu_time": 1.8842081672509859e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4614890332987638e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 62469, - "real_time": 1.1205046662303273e+04, - "cpu_time": 1.8858263234564409e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4621982838429482e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 62469, - "real_time": 1.1208914559067718e+04, - "cpu_time": 1.8835649137973614e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4616937183043985e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 62469, - "real_time": 1.1206757783981271e+04, - "cpu_time": 1.8856784052889445e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4619750257669513e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1207509382861184e+04, - "cpu_time": 1.8848382496918555e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4618770264734445e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time_median", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1206757783981271e+04, - "cpu_time": 1.8849134386655434e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.4619750257669513e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1687757958739464e+00, - "cpu_time": 9.6257373107076525e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8287290997902222e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9351095071938954e-04, - "cpu_time": 5.1069301635200395e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9349979844844405e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 62157, - "real_time": 1.1259026095906882e+04, - "cpu_time": 1.9609121611403221e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9103760592501435e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 62157, - "real_time": 1.1258892241104260e+04, - "cpu_time": 1.9574448911626674e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9104106601508918e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 62157, - "real_time": 1.1258801357318105e+04, - "cpu_time": 1.9633190919766992e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9104341536944466e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 62157, - "real_time": 1.1258837298081140e+04, - "cpu_time": 1.9563476213460843e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9104248629283147e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 62157, - "real_time": 1.1258258650078424e+04, - "cpu_time": 1.9613800987820880e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9105744519177256e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1258763128497761e+04, - "cpu_time": 1.9598807728815722e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9104440375883045e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time_median", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1258837298081142e+04, - "cpu_time": 1.9609121611403221e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.9104248629283147e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9465355191019710e-01, - "cpu_time": 2.8961378427859689e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.6171461322466435e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6171041041300618e-05, - "cpu_time": 1.4777112377748558e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6171766348610080e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 55202, - "real_time": 1.2686973153907709e+04, - "cpu_time": 2.3184647621462918e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1656135159247408e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 55202, - "real_time": 1.2692697328785060e+04, - "cpu_time": 2.3160441143437896e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1632839184918213e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 55202, - "real_time": 1.2711856383666585e+04, - "cpu_time": 2.3405630357593636e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1555019205697565e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 55202, - "real_time": 1.2709444866883945e+04, - "cpu_time": 2.3284233143724861e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1564801363403587e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 55202, - "real_time": 1.2695262824641924e+04, - "cpu_time": 2.3215349751820911e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1622405069702425e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2699246911577047e+04, - "cpu_time": 2.3250060403608044e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1606239996593838e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time_median", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2695262824641924e+04, - "cpu_time": 2.3215349751820908e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.1622405069702425e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0867522596071060e+01, - "cpu_time": 9.8596475543444328e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4156209657623470e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.5576118581991460e-04, - "cpu_time": 4.2406976081723943e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5563702491283820e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 45094, - "real_time": 1.5528669070399939e+04, - "cpu_time": 2.9211974275957687e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4406460982444172e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 45094, - "real_time": 1.5526714265124367e+04, - "cpu_time": 2.9168146338757193e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4417087712118158e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 45094, - "real_time": 1.5529184215609062e+04, - "cpu_time": 2.9205343438148841e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4403660990932026e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 45094, - "real_time": 1.5527174678695417e+04, - "cpu_time": 2.9172978888543836e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4414584566915293e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 45094, - "real_time": 1.5530045484462178e+04, - "cpu_time": 2.9200027675520323e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4398980113186169e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5528357542858193e+04, - "cpu_time": 2.9191694123385580e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4408154873119173e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time_median", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5528669070399939e+04, - "cpu_time": 2.9200027675520327e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4406460982444172e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3900641477610245e+00, - "cpu_time": 1.9822932734768628e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5560742230340745e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.9517783443899588e-05, - "cpu_time": 6.7906071675670249e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9518296358832039e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 30118, - "real_time": 2.3242995856809663e+04, - "cpu_time": 4.5477439836640151e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1278408412364702e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 30118, - "real_time": 2.3243170971169577e+04, - "cpu_time": 4.5491395876218419e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1278323440685389e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 30118, - "real_time": 2.3243457612626826e+04, - "cpu_time": 4.5453686566171345e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1278184354878094e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 30118, - "real_time": 2.3243442001798612e+04, - "cpu_time": 4.5502092602434670e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1278191929565117e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 30118, - "real_time": 2.3243893997473551e+04, - "cpu_time": 4.5462874360849702e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1277972616313480e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3243392087975652e+04, - "cpu_time": 4.5477497848462852e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1278216150761356e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time_median", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3243442001798616e+04, - "cpu_time": 4.5477439836640144e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1278191929565117e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4080397808047469e-01, - "cpu_time": 1.9867586781435932e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6536502749977095e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4662402836493929e-05, - "cpu_time": 4.3686631238238754e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4662338909740410e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 18975, - "real_time": 3.6888118707416921e+04, - "cpu_time": 7.2497563899875327e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4212923249311270e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 18975, - "real_time": 3.6885609915243811e+04, - "cpu_time": 7.2583089275366234e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4213889947996389e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 18975, - "real_time": 3.6882575066350350e+04, - "cpu_time": 7.2488830777338531e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4215059524906431e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 18975, - "real_time": 3.6887127492686966e+04, - "cpu_time": 7.2570974334643004e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4213305172758232e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 18975, - "real_time": 3.6888512216320654e+04, - "cpu_time": 7.2657634888013286e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4212771632682934e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6886388679603740e+04, - "cpu_time": 7.2559618635047285e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4213589905531052e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time_median", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6887127492686959e+04, - "cpu_time": 7.2570974334643004e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4213305172758232e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4082342562588099e+00, - "cpu_time": 6.9189449456024505e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2801944255494990e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.5287883755083857e-05, - "cpu_time": 9.5355310236712118e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5290996062424876e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 12121, - "real_time": 5.7785560421228191e+04, - "cpu_time": 1.2028927967988279e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8145986512139000e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 12121, - "real_time": 5.7763898647434864e+04, - "cpu_time": 1.2019690116326652e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8152791355030262e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 12121, - "real_time": 5.7759794207771498e+04, - "cpu_time": 1.2032673541787532e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8154081301399712e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 12121, - "real_time": 5.7775791957104564e+04, - "cpu_time": 1.2014960844815888e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8149054551749142e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 12121, - "real_time": 5.7782383071286116e+04, - "cpu_time": 1.2029607647884985e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8146984327496014e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.7773485660965067e+04, - "cpu_time": 1.2025172023760667e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8149779609562828e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time_median", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.7775791957104564e+04, - "cpu_time": 1.2028927967988283e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8149054551749142e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1287708617504526e+01, - "cpu_time": 7.4895616642039613e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5461973330766577e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9537870163736934e-04, - "cpu_time": 6.2282366101751015e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9538514568012843e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6554, - "real_time": 1.0682966744104722e+05, - "cpu_time": 2.2039354653646934e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9630801538882355e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6554, - "real_time": 1.0708349296031080e+05, - "cpu_time": 2.2097392401588309e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9584269638806835e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6554, - "real_time": 1.0680433278310632e+05, - "cpu_time": 2.2050945514187138e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9635458088192047e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6554, - "real_time": 1.0687461505665303e+05, - "cpu_time": 2.2043006454074426e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9622545530464119e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6554, - "real_time": 1.0709147285072690e+05, - "cpu_time": 2.2074622184924339e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9582810322565895e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0693671621836885e+05, - "cpu_time": 2.2061064241684228e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9611177023782253e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time_median", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0687461505665304e+05, - "cpu_time": 2.2050945514187138e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.9622545530464119e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3994141289260480e+02, - "cpu_time": 2.4511892923974946e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5654491466270775e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3086376488954375e-03, - "cpu_time": 1.1110929488913730e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3081566412439121e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3433, - "real_time": 2.0392353367219804e+05, - "cpu_time": 4.2054365540341765e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0568023339288727e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3433, - "real_time": 2.0399046644614966e+05, - "cpu_time": 4.2066594115933694e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0561274617739212e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3433, - "real_time": 2.0395983616090217e+05, - "cpu_time": 4.2066348674628069e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0564362469340038e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3433, - "real_time": 2.0412329139435207e+05, - "cpu_time": 4.2098412612878939e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0547895202693428e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3433, - "real_time": 2.0396725754865314e+05, - "cpu_time": 4.2075678473643417e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0563614231070961e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0399287704445102e+05, - "cpu_time": 4.2072279883485177e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0561033972026470e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time_median", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0396725754865314e+05, - "cpu_time": 4.2066594115933694e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0563614231070961e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6763069662455763e+01, - "cpu_time": 1.6453729389930433e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7342267929302407e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.7630269632271879e-04, - "cpu_time": 3.9108242851343774e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7615942872584848e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1751, - "real_time": 3.9966002614013973e+05, - "cpu_time": 7.9455092861222546e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0989359583984402e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1751, - "real_time": 3.9977195767698006e+05, - "cpu_time": 7.9470035808101250e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0983482805409988e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1751, - "real_time": 3.9988801052231662e+05, - "cpu_time": 7.9472441176475759e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0977393118246178e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1751, - "real_time": 3.9969628557364974e+05, - "cpu_time": 7.9448311993139412e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0987455482506054e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1751, - "real_time": 3.9975083637400198e+05, - "cpu_time": 7.9466567846940609e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0984591492265751e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9975342325741763e+05, - "cpu_time": 7.9462489937175927e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0984456496482475e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time_median", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9975083637400193e+05, - "cpu_time": 7.9466567846940621e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.0984591492265751e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7252055713263928e+01, - "cpu_time": 1.0348037328066937e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5796231944211302e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1826468677187225e-04, - "cpu_time": 1.3022543512351841e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1823882811493309e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 885, - "real_time": 7.9043965732762963e+05, - "cpu_time": 1.6493589096045599e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1225169871564285e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 885, - "real_time": 7.9066763088727999e+05, - "cpu_time": 1.6494661050849361e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1219050008627220e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 885, - "real_time": 7.9033550593244319e+05, - "cpu_time": 1.6490581875705123e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1227966950828213e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 885, - "real_time": 7.9055064874780120e+05, - "cpu_time": 1.6493218237287358e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1222189908482651e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 885, - "real_time": 7.9033297702333343e+05, - "cpu_time": 1.6491504734462954e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1228034876121178e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9046528398369753e+05, - "cpu_time": 1.6492710998870081e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1224482323124710e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time_median", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9043965732762951e+05, - "cpu_time": 1.6493218237287358e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1225169871564285e+10, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4425291298122960e+02, - "cpu_time": 1.6446342237157512e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8730218129414143e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8249114275359452e-04, - "cpu_time": 9.9718853002906885e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8247897658835434e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 75, - "real_time": 9.2094526315728817e+06, - "cpu_time": 1.8055919546668518e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6434773425040398e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 75, - "real_time": 9.2294038087129593e+06, - "cpu_time": 1.8083185559999038e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6356012474308639e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 75, - "real_time": 9.3339869876702633e+06, - "cpu_time": 1.8179442386666171e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5948659500301161e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 75, - "real_time": 9.2271487911542263e+06, - "cpu_time": 1.8080985359999128e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6364897499179344e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 75, - "real_time": 9.2283093680938091e+06, - "cpu_time": 1.8080569613333259e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6360324152126875e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2456603174408264e+06, - "cpu_time": 1.8096020493333228e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6292933410191288e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time_median", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2283093680938073e+06, - "cpu_time": 1.8080985359999128e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6360324152126875e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0051481782579220e+04, - "cpu_time": 4.7950022552727991e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9515533900824748e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.4135107784744280e-03, - "cpu_time": 2.6497550978345384e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3772269329281225e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 38, - "real_time": 1.8346507053234074e+07, - "cpu_time": 3.5705407078951694e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6578550786412621e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 38, - "real_time": 1.8342965429550722e+07, - "cpu_time": 3.5688169500004783e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6585613301046114e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 38, - "real_time": 1.8326047954982832e+07, - "cpu_time": 3.5699496684209839e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6619386877547250e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 38, - "real_time": 1.8302270309313346e+07, - "cpu_time": 3.5681600763155080e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6666961456607261e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 38, - "real_time": 1.8329815939068794e+07, - "cpu_time": 3.5682376973682038e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6611859182372847e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8329521337229952e+07, - "cpu_time": 3.5691410200000688e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6612474320797219e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time_median", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8329815939068794e+07, - "cpu_time": 3.5688169500004783e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6611859182372847e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7493054789854952e+04, - "cpu_time": 1.0602242822715274e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4961873421657486e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.5436506322311792e-04, - "cpu_time": 2.9705306580223240e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5491698035272824e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19, - "real_time": 3.6459562417707942e+07, - "cpu_time": 6.9886123473691583e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6812764361322165e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19, - "real_time": 3.6519166866415426e+07, - "cpu_time": 6.9986495052633375e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6752680719951558e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19, - "real_time": 3.6439167041527599e+07, - "cpu_time": 6.9847428210526854e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6833368843760853e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19, - "real_time": 3.6538670525739066e+07, - "cpu_time": 6.9979573210527003e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6733062825986657e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19, - "real_time": 3.6492792595373958e+07, - "cpu_time": 6.9904025789475396e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6779242818762584e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6489871889352798e+07, - "cpu_time": 6.9920729147370845e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6782223913956766e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time_median", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6492792595373958e+07, - "cpu_time": 6.9904025789475396e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6779242818762584e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1041682411149115e+04, - "cpu_time": 6.0492479323753287e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1373368794914442e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1247417512343875e-03, - "cpu_time": 8.6515801624800293e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1248196653823206e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.2489783167839050e+07, - "cpu_time": 1.3557895433331800e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7030798585571513e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.2529182665877879e+07, - "cpu_time": 1.3552706800000024e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.7010682615383768e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.2609995802243546e+07, - "cpu_time": 1.3559345388888586e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6969490637500587e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.2621678312619522e+07, - "cpu_time": 1.3575145066665250e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6963543426309628e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.2568363613552511e+07, - "cpu_time": 1.3571991788889036e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6990699890863776e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2563800712426513e+07, - "cpu_time": 1.3563416895554939e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6993043031125855e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time_median", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2568363613552526e+07, - "cpu_time": 1.3559345388888586e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6990699890863776e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5185208727295932e+04, - "cpu_time": 9.6546446311566309e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8138359321040735e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.6050604000191919e-04, - "cpu_time": 7.1181507620846573e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.6063921795687880e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4323308765888214e+08, - "cpu_time": 2.5948071080001682e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7482324843725286e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4333968758583069e+08, - "cpu_time": 2.5978127099997434e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7454449709088831e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4282758533954620e+08, - "cpu_time": 2.5928347640001449e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7588741049124970e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4339115023612976e+08, - "cpu_time": 2.5974664339996704e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7441007420325899e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4335143566131592e+08, - "cpu_time": 2.5954030180000702e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7451380205805445e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4322858929634094e+08, - "cpu_time": 2.5956648067999595e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7483580645614085e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time_median", - "family_index": 6, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4333968758583069e+08, - "cpu_time": 2.5954030180000702e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7454449709088831e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3167030835270439e+05, - "cpu_time": 2.0416091436119328e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0741762413680423e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6174864912854579e-03, - "cpu_time": 7.8654575824407434e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6204898616265933e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8848634660243988e+08, - "cpu_time": 4.5634266499996555e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7219848933776846e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8809632360935211e+08, - "cpu_time": 4.5605546100000536e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7270236931449146e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8869147598743439e+08, - "cpu_time": 4.5693040950004613e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7193402414373183e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8752599656581879e+08, - "cpu_time": 4.5548953999991679e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7344164938985100e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8813619911670685e+08, - "cpu_time": 4.5612091899999994e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7265079059541941e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8818726837635040e+08, - "cpu_time": 4.5618779889998674e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7258546455625248e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time_median", - "family_index": 6, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8813619911670685e+08, - "cpu_time": 4.5612091900000000e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7265079059541941e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4492486101884814e+05, - "cpu_time": 5.2081804516891466e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7556735353701217e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5438741049372470e-03, - "cpu_time": 1.1416746489598623e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5447928281971765e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 97108, - "real_time": 7.2132160886614001e+03, - "cpu_time": 1.4401502337602102e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5490410498364463e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 97108, - "real_time": 7.2140173319569913e+03, - "cpu_time": 1.4380872338015097e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5486468665102765e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 97108, - "real_time": 7.2209428740272388e+03, - "cpu_time": 1.4369776856697326e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5452433908707075e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 97108, - "real_time": 7.1994045256284508e+03, - "cpu_time": 1.4342969158051721e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5558496412958995e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 97108, - "real_time": 7.2221654906725380e+03, - "cpu_time": 1.4394541047081068e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5446432282758579e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2139492621893241e+03, - "cpu_time": 1.4377932347489463e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5486848353578381e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time_median", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2140173319569922e+03, - "cpu_time": 1.4380872338015097e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.5486468665102765e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0624024895589361e+00, - "cpu_time": 2.3070400548308506e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4620875849343211e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2562331893652152e-03, - "cpu_time": 1.6045701141678300e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2573919048757618e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 94612, - "real_time": 7.4279793171047995e+03, - "cpu_time": 1.4657860324271765e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.8928571034250274e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 94612, - "real_time": 7.4044449526348644e+03, - "cpu_time": 1.4597628989981342e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9147654317803428e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 94612, - "real_time": 7.4009014135266452e+03, - "cpu_time": 1.4624103824038679e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9180762098008275e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 94612, - "real_time": 7.3773934304591821e+03, - "cpu_time": 1.4561986006002890e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9401205835938752e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 94612, - "real_time": 7.4010886183782650e+03, - "cpu_time": 1.4637251352893818e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9179012223770678e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4023615464207496e+03, - "cpu_time": 1.4615766099437698e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9167441101954281e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time_median", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4010886183782641e+03, - "cpu_time": 1.4624103824038679e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 6.9179012223770678e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7942755535663785e+01, - "cpu_time": 3.7162853500168652e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6763630030888299e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4239231525160520e-03, - "cpu_time": 2.5426551880573939e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4236302173125577e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 92912, - "real_time": 7.5224911135683260e+03, - "cpu_time": 1.4712475180815631e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3612511926441628e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 92912, - "real_time": 7.5369395224518175e+03, - "cpu_time": 1.4721529533321622e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3586416568019456e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 92912, - "real_time": 7.5232842435611346e+03, - "cpu_time": 1.4729839525572035e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3611076849534148e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 92912, - "real_time": 7.5378963073296500e+03, - "cpu_time": 1.4740861040554413e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3584692044706020e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 92912, - "real_time": 7.5254081038709983e+03, - "cpu_time": 1.4753633179782859e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3607235459738910e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5292038581563875e+03, - "cpu_time": 1.4731667692009312e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3600386569688031e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time_median", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5254081038709992e+03, - "cpu_time": 1.4729839525572035e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3607235459738910e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5813867818172032e+00, - "cpu_time": 1.6135963331098363e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3690258542116726e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0069307359242619e-03, - "cpu_time": 1.0953249603811498e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0066080454381346e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 88945, - "real_time": 7.8878217392966790e+03, - "cpu_time": 1.5234284535387200e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5964075605271107e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 88945, - "real_time": 7.8813743933828482e+03, - "cpu_time": 1.5197355635503407e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5985315476441365e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 88945, - "real_time": 7.8917740153919794e+03, - "cpu_time": 1.5232073865873315e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5951072547257644e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 88945, - "real_time": 7.8513747392298637e+03, - "cpu_time": 1.5223740052841264e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6084603881751376e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 88945, - "real_time": 7.8468795797652392e+03, - "cpu_time": 1.5187749901626117e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6099546694729212e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8718448934133221e+03, - "cpu_time": 1.5215040798246260e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6016922841090143e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time_median", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8813743933828473e+03, - "cpu_time": 1.5223740052841264e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5985315476441365e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1127795523234632e+01, - "cpu_time": 2.1175940721753911e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9884800719469751e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6839699980512922e-03, - "cpu_time": 1.3917767952482075e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6861286073807445e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 81033, - "real_time": 8.6439451795679197e+03, - "cpu_time": 1.5973479915592214e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7385770211522144e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 81033, - "real_time": 8.6409287029265270e+03, - "cpu_time": 1.5975486073577014e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7402312191428673e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 81033, - "real_time": 8.6434666660911444e+03, - "cpu_time": 1.6011541877999685e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7388393548954856e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 81033, - "real_time": 8.6359667405607943e+03, - "cpu_time": 1.5966425357570299e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7429548110256135e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 81033, - "real_time": 8.6466316587177353e+03, - "cpu_time": 1.6005008811226384e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7371047613324869e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6421877895728267e+03, - "cpu_time": 1.5986388407193121e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7395414335097343e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time_median", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6434666660911462e+03, - "cpu_time": 1.5975486073577016e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.7388393548954856e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0236385162642110e+00, - "cpu_time": 2.0392583969403056e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2072226403333218e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6558100960487171e-04, - "cpu_time": 1.2756217007856105e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6570383892578928e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 65538, - "real_time": 1.0685370703899078e+04, - "cpu_time": 1.8237997970645509e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6665566661255383e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 65538, - "real_time": 1.0681483497079565e+04, - "cpu_time": 1.8195590008851821e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6693466803930211e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 65538, - "real_time": 1.0683712662237778e+04, - "cpu_time": 1.8239541960390328e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6677464650983310e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 65538, - "real_time": 1.0683380713768544e+04, - "cpu_time": 1.8214674463671618e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6679847133429420e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 65538, - "real_time": 1.0686181182954302e+04, - "cpu_time": 1.8228672144405220e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6659752064350069e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0684025751987854e+04, - "cpu_time": 1.8223295309592901e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6675219462789679e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time_median", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0683712662237778e+04, - "cpu_time": 1.8228672144405216e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 7.6677464650983310e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8324804030108972e+00, - "cpu_time": 1.8377533363925444e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3151413003932315e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7151591034586831e-04, - "cpu_time": 1.0084637850461301e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7152103503681091e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 65634, - "real_time": 1.0667301117354687e+04, - "cpu_time": 1.8530191867019079e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5359086445347254e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 65634, - "real_time": 1.0667687025473682e+04, - "cpu_time": 1.8534143264162645e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5358530823857286e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 65634, - "real_time": 1.0667276980811426e+04, - "cpu_time": 1.8541631806685135e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5359121197913923e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 65634, - "real_time": 1.0664836826813314e+04, - "cpu_time": 1.8533774629005202e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5362635421488760e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 65634, - "real_time": 1.0671513546104805e+04, - "cpu_time": 1.8537995459668869e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5353023663621085e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0667723099311581e+04, - "cpu_time": 1.8535547405308185e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5358479510445662e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time_median", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0667301117354686e+04, - "cpu_time": 1.8534143264162642e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.5359086445347254e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4018975642320464e+00, - "cpu_time": 4.3820385830021582e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4576229892803525e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2515559711022568e-04, - "cpu_time": 2.3641268785766940e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2512794882649303e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 64416, - "real_time": 1.0864360169022946e+04, - "cpu_time": 1.9524861540609203e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0161003032125077e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 64416, - "real_time": 1.0870672073237896e+04, - "cpu_time": 1.9503293063834783e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0143490466123362e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 64416, - "real_time": 1.0864017747642190e+04, - "cpu_time": 1.9521214154869300e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0161953672352586e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 64416, - "real_time": 1.0868887841594193e+04, - "cpu_time": 1.9508827232365409e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0148438807694750e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 64416, - "real_time": 1.0863535777362418e+04, - "cpu_time": 1.9527118014157815e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0163291833845105e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0866294721771930e+04, - "cpu_time": 1.9517062801167303e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0155635562428179e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time_median", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0864360169022946e+04, - "cpu_time": 1.9521214154869296e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0161003032125077e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2566990968546117e+00, - "cpu_time": 1.0447387739552255e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0366390070645185e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9970649427807469e-04, - "cpu_time": 5.3529508235877613e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9966667385792196e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 55658, - "real_time": 1.2588766208202469e+04, - "cpu_time": 2.2766560835818193e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2059112796374502e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 55658, - "real_time": 1.2587719891332261e+04, - "cpu_time": 2.2760620090556127e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2063440055674601e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 55658, - "real_time": 1.2596926900457409e+04, - "cpu_time": 2.2783652987890957e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2025387237597065e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 55658, - "real_time": 1.2588078620158352e+04, - "cpu_time": 2.2765376226236694e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2061956377561607e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 55658, - "real_time": 1.2588245075206085e+04, - "cpu_time": 2.2768989669051527e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2061267959487276e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2589947339071314e+04, - "cpu_time": 2.2769039961910697e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2054232885339012e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time_median", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2588245075206083e+04, - "cpu_time": 2.2766560835818196e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2061267959487276e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9198432128698535e+00, - "cpu_time": 8.7178884517492659e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6200320297080548e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1134706979314475e-04, - "cpu_time": 3.8288344463943274e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1122003724010967e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 46786, - "real_time": 1.4969641488187308e+04, - "cpu_time": 2.8160178600436335e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7558543137743282e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 46786, - "real_time": 1.4964800502935523e+04, - "cpu_time": 2.8142805988971329e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7586867579216099e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 46786, - "real_time": 1.4968010566623771e+04, - "cpu_time": 2.8160909246351501e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7568083558324871e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 46786, - "real_time": 1.4963250112067732e+04, - "cpu_time": 2.8142232505450324e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7595942738597641e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 46786, - "real_time": 1.4970858924059175e+04, - "cpu_time": 2.8167066002648440e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7551422844121838e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4967312318774702e+04, - "cpu_time": 2.8154638468771584e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7572171971600761e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time_median", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4968010566623771e+04, - "cpu_time": 2.8160178600436331e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.7568083558324871e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2133211518728375e+00, - "cpu_time": 1.1383923012716840e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8801574225154659e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1468925638988044e-04, - "cpu_time": 4.0433561330732769e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1469804621554803e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 30942, - "real_time": 2.2625834357663716e+04, - "cpu_time": 4.3729642783272997e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1586047871476963e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 30942, - "real_time": 2.2622116333916936e+04, - "cpu_time": 4.3725866362872235e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1587952078867712e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 30942, - "real_time": 2.2624240502030814e+04, - "cpu_time": 4.3732560823473672e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1586864097226566e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 30942, - "real_time": 2.2622854874948283e+04, - "cpu_time": 4.3746060694197389e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1587573780985910e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 30942, - "real_time": 2.2623651431171686e+04, - "cpu_time": 4.3740444153573175e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1587165794059597e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2623739499946289e+04, - "cpu_time": 4.3734914963477888e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1587120724523350e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time_median", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2623651431171686e+04, - "cpu_time": 4.3732560823473657e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1587165794059597e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4198958337705361e+00, - "cpu_time": 8.2160557178899527e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2720572759020538e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.2761323510373117e-05, - "cpu_time": 1.8786033366592817e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2759830062970181e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19299, - "real_time": 3.6273046605437929e+04, - "cpu_time": 7.0700937924243815e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4453927890396738e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19299, - "real_time": 3.6268733986373976e+04, - "cpu_time": 7.0704884346345556e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4455646568666361e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19299, - "real_time": 3.6274459629282064e+04, - "cpu_time": 7.0693097362554661e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4453364856654560e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19299, - "real_time": 3.6269823979604451e+04, - "cpu_time": 7.0705163635419696e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4455212142601576e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19299, - "real_time": 3.6273724500817756e+04, - "cpu_time": 7.0694771594382255e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4453657770604187e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6271957740303238e+04, - "cpu_time": 7.0699770972589205e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4454361845784687e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time_median", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6273046605437936e+04, - "cpu_time": 7.0700937924243830e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.4453927890396738e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5254723046818319e+00, - "cpu_time": 5.6151587138247923e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0064223539647756e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.9626026881799033e-05, - "cpu_time": 7.9422587040654314e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9627588177355456e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 12468, - "real_time": 5.6191321961527705e+04, - "cpu_time": 1.1658600393005145e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8660817425116364e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 12468, - "real_time": 5.6199224841688832e+04, - "cpu_time": 1.1663674550849109e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8658193292768723e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 12468, - "real_time": 5.6172093441466364e+04, - "cpu_time": 1.1660875986526057e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8667205292832096e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 12468, - "real_time": 5.6177561841532290e+04, - "cpu_time": 1.1662710033687430e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8665388201749683e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 12468, - "real_time": 5.6162179433924241e+04, - "cpu_time": 1.1661098331729081e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8670500514205784e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.6180476304027892e+04, - "cpu_time": 1.1661391859159363e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8664420945334530e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time_median", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.6177561841532282e+04, - "cpu_time": 1.1661098331729083e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8665388201749683e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4854947688199555e+01, - "cpu_time": 1.9424746841010993e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9350366717664823e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6441476942648350e-04, - "cpu_time": 1.6657314217388166e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6440877465314956e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6771, - "real_time": 1.0333879751651482e+05, - "cpu_time": 2.1525926598729569e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0293946227358116e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6771, - "real_time": 1.0344069532997896e+05, - "cpu_time": 2.1533111844633703e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0273954977874245e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6771, - "real_time": 1.0331194139280819e+05, - "cpu_time": 2.1519352015950455e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0299221674930099e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6771, - "real_time": 1.0332542246029749e+05, - "cpu_time": 2.1522887830456090e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0296573196260822e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6771, - "real_time": 1.0344180946380939e+05, - "cpu_time": 2.1545220056120559e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0273736614533207e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0337173323268177e+05, - "cpu_time": 2.1529299669178078e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0287486538191296e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time_median", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0333879751651481e+05, - "cpu_time": 2.1525926598729566e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.0293946227358116e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4169623219720620e+01, - "cpu_time": 1.0240074301432887e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2591384937659558e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.2076566981110568e-04, - "cpu_time": 4.7563434290864799e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2064785176597470e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4189, - "real_time": 1.6723229519686158e+05, - "cpu_time": 3.6051430174264498e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5080705823373249e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4189, - "real_time": 1.6722248101214116e+05, - "cpu_time": 3.6034653926950129e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5082177794596130e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4189, - "real_time": 1.6729711859822596e+05, - "cpu_time": 3.6046633874430909e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5070987684329887e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4189, - "real_time": 1.6710670682567504e+05, - "cpu_time": 3.6024631749817979e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5099555126626240e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4189, - "real_time": 1.6715407121849176e+05, - "cpu_time": 3.6031099379322707e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5092442974466999e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6720253457027912e+05, - "cpu_time": 3.6037689820957248e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5085173880678497e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time_median", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6722248101214116e+05, - "cpu_time": 3.6034653926950129e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5082177794596130e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3758638248693600e+01, - "cpu_time": 1.1090054059047354e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1066257222356617e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.4113349380891793e-04, - "cpu_time": 3.0773487740598949e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4114731972738077e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2172, - "real_time": 3.2187288545934367e+05, - "cpu_time": 7.0942657918973768e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.6061865969320923e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2172, - "real_time": 3.2201739348131139e+05, - "cpu_time": 7.0896637983423297e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.6050170487100853e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2172, - "real_time": 3.2184954111881956e+05, - "cpu_time": 7.0946096270718111e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.6063756284502872e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2172, - "real_time": 3.2218032515252742e+05, - "cpu_time": 7.0968056399635877e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.6036996505074123e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2172, - "real_time": 3.2197829543299455e+05, - "cpu_time": 7.0953489963175158e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.6053333777418285e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2197968812899932e+05, - "cpu_time": 7.0941387707185256e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.6053224604683414e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time_median", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2197829543299455e+05, - "cpu_time": 7.0946096270718123e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.6053333777418285e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3231014977646834e+02, - "cpu_time": 2.6851468947711192e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0703740373054646e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1092700767962430e-04, - "cpu_time": 3.7850216658493076e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1084128876432848e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1103, - "real_time": 6.3504544773847470e+05, - "cpu_time": 1.4964723544877220e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.6418921763390415e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1103, - "real_time": 6.3493215958760912e+05, - "cpu_time": 1.4960207733453626e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.6423635575329597e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1103, - "real_time": 6.3489764318349736e+05, - "cpu_time": 1.4960380135993280e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.6425072104340874e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1103, - "real_time": 6.3505314756184816e+05, - "cpu_time": 1.4962773472348193e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.6418601442119549e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1103, - "real_time": 6.3487399847171560e+05, - "cpu_time": 1.4959598068903815e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.6426056257440895e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3496047930862906e+05, - "cpu_time": 1.4961536591115226e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.6422457428524269e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time_median", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3493215958760923e+05, - "cpu_time": 1.4960380135993280e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.6423635575329597e+10, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3720307817750566e+01, - "cpu_time": 2.1533502366096914e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4837367560709864e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3185121050196489e-04, - "cpu_time": 1.4392574074834256e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3184756813384554e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 73, - "real_time": 9.3105812748409305e+06, - "cpu_time": 1.8184640890411496e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6039030227544279e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 73, - "real_time": 9.2828594505378641e+06, - "cpu_time": 1.8149636972600702e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6146655218458362e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 73, - "real_time": 9.3176782590477429e+06, - "cpu_time": 1.8179478712329924e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6011580425003028e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 73, - "real_time": 9.2829821809922177e+06, - "cpu_time": 1.8145368958902795e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6146177322957559e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 73, - "real_time": 9.3242317973955031e+06, - "cpu_time": 1.8184441164381396e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5986269677865162e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3036665925628524e+06, - "cpu_time": 1.8168713339725263e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6065942574365678e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time_median", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3105812748409286e+06, - "cpu_time": 1.8179478712329920e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6039030227544279e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9543856578008843e+04, - "cpu_time": 1.9530824902384891e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5794844695612378e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1006617534673668e-03, - "cpu_time": 1.0749701719208380e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1015628397712950e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 38, - "real_time": 1.8524499904168278e+07, - "cpu_time": 3.5849097736840308e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6227085398888173e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 38, - "real_time": 1.8493952327652980e+07, - "cpu_time": 3.5841885894737251e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6286923860864415e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 38, - "real_time": 1.8483105752813190e+07, - "cpu_time": 3.5852835342103913e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6308218379254694e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 38, - "real_time": 1.8531417621201590e+07, - "cpu_time": 3.5899157289469779e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6213561947479663e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 38, - "real_time": 1.8531005143334992e+07, - "cpu_time": 3.5883054736844219e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6214368017774205e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8512796149834208e+07, - "cpu_time": 3.5865206199999101e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6250031520852237e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time_median", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8524499904168278e+07, - "cpu_time": 3.5852835342103913e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.6227085398888173e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2649027657165218e+04, - "cpu_time": 2.4635361226928755e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4371147682069261e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2234255416553081e-03, - "cpu_time": 6.8688748336066655e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2240305958505300e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19, - "real_time": 3.6808408796787262e+07, - "cpu_time": 7.0255979315788865e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6463876703008928e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19, - "real_time": 3.7158034937946416e+07, - "cpu_time": 7.0622531368419588e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6120782012327180e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19, - "real_time": 3.6922977158897802e+07, - "cpu_time": 7.0433173315785483e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6350732884402804e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19, - "real_time": 3.6798253067229927e+07, - "cpu_time": 7.0336989263152733e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6473940150035377e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19, - "real_time": 3.6936072142500624e+07, - "cpu_time": 7.0400483263160586e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6337845421728501e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6924749220672406e+07, - "cpu_time": 7.0409831305261448e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6349435434300561e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time_median", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6922977158897802e+07, - "cpu_time": 7.0400483263160571e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6350732884402804e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4499133225014957e+05, - "cpu_time": 1.3679359449339780e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4231709961564001e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.9266707373865070e-03, - "cpu_time": 1.9428195176371026e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9152492443209931e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.3295501371224716e+07, - "cpu_time": 1.3643885200000721e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6623728738880801e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.3300407164626658e+07, - "cpu_time": 1.3656018499998227e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6621277614067841e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.3359765112400055e+07, - "cpu_time": 1.3662461866665074e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6591646059486380e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.3200994067721903e+07, - "cpu_time": 1.3645922766666749e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6671012384293160e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.3308530781004161e+07, - "cpu_time": 1.3653066133333090e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6617219461388726e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3293039699395508e+07, - "cpu_time": 1.3652270893332773e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6624976851623383e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time_median", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3300407164626658e+07, - "cpu_time": 1.3653066133333093e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6621277614067841e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.7499982683200142e+04, - "cpu_time": 7.5688748273339588e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8747309525032076e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.8452173520201802e-04, - "cpu_time": 5.5440409046016636e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8490997117880413e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4451138377189636e+08, - "cpu_time": 2.6104625819998544e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7150769578639050e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4436123669147491e+08, - "cpu_time": 2.6064608760002556e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7189409311267300e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4398314952850342e+08, - "cpu_time": 2.6067128519998732e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7287065448844008e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4442610144615173e+08, - "cpu_time": 2.6070687880001059e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7172706776978855e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4404343962669373e+08, - "cpu_time": 2.6069400139999741e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7271458762118354e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4426506221294403e+08, - "cpu_time": 2.6075290224000129e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7214281975569515e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time_median", - "family_index": 7, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4436123669147491e+08, - "cpu_time": 2.6069400139999741e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7189409311267300e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3688014255084848e+05, - "cpu_time": 1.6561694791594756e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1130168559361920e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6419785838458858e-03, - "cpu_time": 6.3514901078075433e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6426534468538918e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.9113595187664032e+08, - "cpu_time": 4.5888100950003260e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6881114032078190e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.9153901338577271e+08, - "cpu_time": 4.5981865599992490e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6830124775760093e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.9274109005928040e+08, - "cpu_time": 4.6071894249996603e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6678889997388687e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.9127867519855499e+08, - "cpu_time": 4.5860142899994117e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6863042695043359e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.9166996479034424e+08, - "cpu_time": 4.6019867100005740e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6813589111646037e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9167293906211853e+08, - "cpu_time": 4.5964374159998447e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6813352122383270e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time_median", - "family_index": 7, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9153901338577271e+08, - "cpu_time": 4.5981865599992484e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6830124775760093e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3298710833875660e+05, - "cpu_time": 8.8920954705056676e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.9721814050208367e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPageable/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1701948434919675e-03, - "cpu_time": 1.9345625025923270e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1655679109356596e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - } - ] -} diff --git a/results/hipMemcpyAsync_GPUToPinned.json b/results/hipMemcpyAsync_GPUToPinned.json deleted file mode 100644 index cc16236..0000000 --- a/results/hipMemcpyAsync_GPUToPinned.json +++ /dev/null @@ -1,3858 +0,0 @@ -{ - "context": { - "date": "2023-10-09T16:55:39-04:00", - "host_name": "frontier10465", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1796, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [6.47,11.33,11.88], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52235, - "real_time": 1.3454085324331463e+04, - "cpu_time": 2.0377894783191343e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 1.9027677752052665e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52235, - "real_time": 1.3337203987187244e+04, - "cpu_time": 2.0289086359720488e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 1.9194427876032602e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52235, - "real_time": 1.3186539730989720e+04, - "cpu_time": 2.0082922427491154e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 1.9413735917268258e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52235, - "real_time": 1.3334940758000001e+04, - "cpu_time": 2.0219355929932044e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 1.9197685587498281e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52235, - "real_time": 1.3183338191850033e+04, - "cpu_time": 2.0146454235665744e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 1.9418450492171984e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3299221598471693e+04, - "cpu_time": 2.0223142747200160e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 1.9250395525004759e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3334940758000002e+04, - "cpu_time": 2.0219355929932040e+04, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 1.9197685587498281e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1492112619808184e+02, - "cpu_time": 1.1603227839795277e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6615992098446153e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.6411919184268809e-03, - "cpu_time": 5.7375987426097324e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6315068575413302e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52205, - "real_time": 1.3247311615410497e+04, - "cpu_time": 2.0172652945120200e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 3.8649351269460157e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52205, - "real_time": 1.3286441682410798e+04, - "cpu_time": 2.0238151498898569e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 3.8535524577495351e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52205, - "real_time": 1.3318225952499288e+04, - "cpu_time": 2.0290479858251147e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 3.8443558611041471e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52205, - "real_time": 1.3323327234518472e+04, - "cpu_time": 2.0287575653673044e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 3.8428839207183562e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52205, - "real_time": 1.3326873080040150e+04, - "cpu_time": 2.0313490144622177e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 3.8418614548586778e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3300435912975841e+04, - "cpu_time": 2.0260470020113033e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 3.8495177642753467e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3318225952499290e+04, - "cpu_time": 2.0287575653673044e+04, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 3.8443558611041471e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3754449304474456e+01, - "cpu_time": 5.6250320904968305e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7883351717426907e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5378453402075171e-03, - "cpu_time": 2.7763581421915351e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5427432138594892e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52479, - "real_time": 1.3428744710109755e+04, - "cpu_time": 2.0394118275881789e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 7.6254335167239219e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52479, - "real_time": 1.3314139275841755e+04, - "cpu_time": 2.0264469902246623e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 7.6910717154508665e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52479, - "real_time": 1.3351280570019146e+04, - "cpu_time": 2.0291210712856559e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 7.6696762878269106e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52479, - "real_time": 1.3333394843860455e+04, - "cpu_time": 2.0274975132910356e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 7.6799645700998262e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52479, - "real_time": 1.3319397647958092e+04, - "cpu_time": 2.0283799386421284e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 7.6880353531376287e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3349391409557842e+04, - "cpu_time": 2.0301714682063324e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 7.6708362886478320e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3333394843860460e+04, - "cpu_time": 2.0283799386421284e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 7.6799645700998262e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6633528753775536e+01, - "cpu_time": 5.2611530224362411e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6699078353475052e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.4933074717089386e-03, - "cpu_time": 2.5914821013047228e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4805955112074752e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52128, - "real_time": 1.3468469297934842e+04, - "cpu_time": 2.0451500153468442e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.5205885351158839e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52128, - "real_time": 1.3456059822556450e+04, - "cpu_time": 2.0469015903161475e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.5219908554262882e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52128, - "real_time": 1.3475397379251719e+04, - "cpu_time": 2.0529924320902384e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.5198067577237743e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52128, - "real_time": 1.3475203561443317e+04, - "cpu_time": 2.0522792702578263e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.5198286175505021e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52128, - "real_time": 1.3487248049730617e+04, - "cpu_time": 2.0534116693523672e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.5184713682498819e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3472475622183390e+04, - "cpu_time": 2.0501469954726846e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.5201372268132663e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3475203561443317e+04, - "cpu_time": 2.0522792702578263e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.5198286175505021e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1398816209536109e+01, - "cpu_time": 3.8341774167241141e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2863856797243975e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.4608178401652839e-04, - "cpu_time": 1.8701963445504554e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4622996992258853e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51576, - "real_time": 1.3570238159934961e+04, - "cpu_time": 2.0635467329765728e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0183700180687404e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51576, - "real_time": 1.3617236896091308e+04, - "cpu_time": 2.0704426516209089e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0079523704076236e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51576, - "real_time": 1.3633417601955982e+04, - "cpu_time": 2.0761581917946289e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0043824076894319e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51576, - "real_time": 1.3636821748398545e+04, - "cpu_time": 2.0771142469365615e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0036324266547072e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51576, - "real_time": 1.3637286882233237e+04, - "cpu_time": 2.0784069799906949e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0035299802457780e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3619000257722806e+04, - "cpu_time": 2.0731337606638735e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0075734406132567e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3633417601955985e+04, - "cpu_time": 2.0761581917946292e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0043824076894319e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8463650528154325e+01, - "cpu_time": 6.1634297363464761e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3002683755535365e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0899955936202947e-03, - "cpu_time": 2.9730014788687726e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0948011744208266e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 50322, - "real_time": 1.3798449863577252e+04, - "cpu_time": 2.1236514148881161e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 5.9368987683347070e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 50322, - "real_time": 1.3811272590445869e+04, - "cpu_time": 2.1222058562855207e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 5.9313868047662199e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 50322, - "real_time": 1.3793247698380748e+04, - "cpu_time": 2.1298020507929061e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 5.9391378877084148e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 50322, - "real_time": 1.3810728769636104e+04, - "cpu_time": 2.1340698799729616e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 5.9316203631561506e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 50322, - "real_time": 1.3777194034978558e+04, - "cpu_time": 2.1381403879019137e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 5.9460583767649245e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3798178591403708e+04, - "cpu_time": 2.1295739179682838e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 5.9370204401460838e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3798449863577252e+04, - "cpu_time": 2.1298020507929061e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 5.9368987683347070e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4086329252794323e+01, - "cpu_time": 6.7641426240481351e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0638553247913159e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0208832390073666e-03, - "cpu_time": 3.1762891942729338e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0213633902601338e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49547, - "real_time": 1.4118803353911655e+04, - "cpu_time": 2.2180979009829094e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.1604382885225728e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49547, - "real_time": 1.4261388916744452e+04, - "cpu_time": 2.2408044503198933e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.1488362105294924e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49547, - "real_time": 1.4237295107339834e+04, - "cpu_time": 2.2339299553958965e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.1507803888642766e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49547, - "real_time": 1.4261502487993177e+04, - "cpu_time": 2.2314195248955541e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.1488270617905629e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49547, - "real_time": 1.4108478324423633e+04, - "cpu_time": 2.2155082063495243e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.1612875338679962e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4197493638082553e+04, - "cpu_time": 2.2279520075887558e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.1540338967149801e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4237295107339834e+04, - "cpu_time": 2.2314195248955544e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.1507803888642766e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7265424585996286e+01, - "cpu_time": 1.0780728485271615e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2917380611719685e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.4421876533717111e-03, - "cpu_time": 4.8388513076362298e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4519525631627815e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 47214, - "real_time": 1.4879928993340669e+04, - "cpu_time": 2.3958850277460191e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.2021610462432261e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 47214, - "real_time": 1.4875616734282377e+04, - "cpu_time": 2.4022779620451500e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.2027994257530713e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 47214, - "real_time": 1.4814705222423083e+04, - "cpu_time": 2.3909495467446086e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.2118563621774507e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 47214, - "real_time": 1.4818709830845966e+04, - "cpu_time": 2.3869183060109364e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.2112586300726118e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 47214, - "real_time": 1.4838393142940069e+04, - "cpu_time": 2.3917259414580418e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.2083253681407294e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4845470784766430e+04, - "cpu_time": 2.3935513568009512e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.2072801664774184e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4838393142940065e+04, - "cpu_time": 2.3917259414580414e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.2083253681407294e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0858175194175153e+01, - "cpu_time": 5.8244866445699948e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5865187118772333e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0786255715002345e-03, - "cpu_time": 2.4334078431283734e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0779050985615583e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 40826, - "real_time": 1.6655007561218190e+04, - "cpu_time": 2.8376005168275118e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.9349126536935973e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 40826, - "real_time": 1.6662920323938775e+04, - "cpu_time": 2.8361932371528070e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.9330440718634262e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 40826, - "real_time": 1.7221535875586982e+04, - "cpu_time": 2.8890282565032041e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.8054677860006065e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 40826, - "real_time": 1.7020580796392260e+04, - "cpu_time": 2.8736632366629128e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.8503973973609195e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 40826, - "real_time": 1.6805612904586073e+04, - "cpu_time": 2.8493063709400918e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.8996495023466792e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6873131492344452e+04, - "cpu_time": 2.8571583236173057e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.8846942822530460e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6805612904586069e+04, - "cpu_time": 2.8493063709400914e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.8996495023466792e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4466939728546805e+02, - "cpu_time": 2.3301290707422135e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5982942972153224e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4500532838049505e-02, - "cpu_time": 8.1554076002066048e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4411157971402636e-02, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 35095, - "real_time": 1.9975639513666567e+04, - "cpu_time": 3.6695036557914420e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.5615921788298979e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 35095, - "real_time": 1.9885085648935510e+04, - "cpu_time": 3.6357721384812736e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.5914727406274242e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 35095, - "real_time": 1.9964696663269748e+04, - "cpu_time": 3.6701273628722003e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.5651886532862301e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 35095, - "real_time": 1.9929903344682229e+04, - "cpu_time": 3.6530998546801646e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.5766500586152172e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 35095, - "real_time": 1.9898953936944865e+04, - "cpu_time": 3.5999631514460729e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.5868789090791674e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9930855821499783e+04, - "cpu_time": 3.6456932326542308e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.5763565080875883e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9929903344682229e+04, - "cpu_time": 3.6530998546801653e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.5766500586152172e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9573753304519713e+01, - "cpu_time": 2.9191135025073629e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3057698686748749e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9855521337839781e-03, - "cpu_time": 8.0070190118056508e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9855521322012302e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 29537, - "real_time": 2.3694661690657071e+04, - "cpu_time": 4.9952309747096944e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1063420251463846e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 29537, - "real_time": 2.3691333689518771e+04, - "cpu_time": 4.9621267190303617e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1064974367229252e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 29537, - "real_time": 2.3680747889745449e+04, - "cpu_time": 4.9774011510986318e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1069920646953768e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 29537, - "real_time": 2.3671143419944528e+04, - "cpu_time": 4.9751365880082965e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1074412222061316e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 29537, - "real_time": 2.3688962868969942e+04, - "cpu_time": 4.9867550834546651e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1066081763477335e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3685369911767153e+04, - "cpu_time": 4.9793301032603296e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1067761850237104e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3688962868969942e+04, - "cpu_time": 4.9774011510986325e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1066081763477335e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.4679630673641206e+00, - "cpu_time": 1.2502308779866603e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4252141622118130e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.9973887267263377e-04, - "cpu_time": 2.5108415229752349e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9982918155372234e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 20203, - "real_time": 3.4650176731843450e+04, - "cpu_time": 7.3905771766569480e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.5130889636074503e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 20203, - "real_time": 3.4657723620469842e+04, - "cpu_time": 7.4117631638865700e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.5127594810939646e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 20203, - "real_time": 3.4646981458664792e+04, - "cpu_time": 7.3870178636836426e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.5132285062855942e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 20203, - "real_time": 3.4693106967712120e+04, - "cpu_time": 7.4108546206008526e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.5112166243511711e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 20203, - "real_time": 3.4672253574392598e+04, - "cpu_time": 7.3661698807107678e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.5121255354085669e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4664048470616559e+04, - "cpu_time": 7.3932765411077562e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.5124838221493494e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4657723620469842e+04, - "cpu_time": 7.3905771766569465e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.5127594810939646e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8943546023390205e+01, - "cpu_time": 1.8920707900371826e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2627146697632009e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.4648971655598603e-04, - "cpu_time": 2.5591776251259880e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4630102806794208e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 12625, - "real_time": 5.5517649586084255e+04, - "cpu_time": 1.2279796744554563e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8887254914747513e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 12625, - "real_time": 5.5582090171450509e+04, - "cpu_time": 1.2245718106930668e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8865357469744747e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 12625, - "real_time": 5.5574984751620999e+04, - "cpu_time": 1.2271627999999929e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8867769459341423e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 12625, - "real_time": 5.5525695301401014e+04, - "cpu_time": 1.2244084308910898e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8884518137200932e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 12625, - "real_time": 5.5555832405150453e+04, - "cpu_time": 1.2261762526732622e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8874273943968285e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5551250443141456e+04, - "cpu_time": 1.2260597937425735e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8875834785000580e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5555832405150446e+04, - "cpu_time": 1.2261762526732622e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.8874273943968285e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8798799788759300e+01, - "cpu_time": 1.5698105188034907e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7862123256426435e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.1841856950161404e-04, - "cpu_time": 1.2803702778733251e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1845189561730651e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7248, - "real_time": 9.6243652110317955e+04, - "cpu_time": 2.1791016956401744e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.1790029305996918e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7248, - "real_time": 9.6242176138949260e+04, - "cpu_time": 2.1684709616445893e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.1790363478193230e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7248, - "real_time": 9.6311357810115631e+04, - "cpu_time": 2.1788178449227428e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.1774711183437756e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7248, - "real_time": 9.6281731544218870e+04, - "cpu_time": 2.1705055974061831e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.1781411347352539e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7248, - "real_time": 9.6276484023804107e+04, - "cpu_time": 2.1726458692053054e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.1782598536538628e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6271080325481176e+04, - "cpu_time": 2.1739083937637991e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.1783822770303818e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6276484023804122e+04, - "cpu_time": 2.1726458692053054e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.1782598536538628e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8951179427801815e+01, - "cpu_time": 4.8428234125861235e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5505089147760114e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0072561074334360e-04, - "cpu_time": 2.2277035345548736e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0070520605344841e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3813, - "real_time": 1.8357034682521780e+05, - "cpu_time": 4.2909884552845248e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.2848483279238491e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3813, - "real_time": 1.8353737418510145e+05, - "cpu_time": 4.2625442774717812e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.2852588028038109e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3813, - "real_time": 1.8358819036993181e+05, - "cpu_time": 4.2637528901127534e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.2846262559418667e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3813, - "real_time": 1.8354852860403893e+05, - "cpu_time": 4.2643559874114738e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.2851199254493534e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3813, - "real_time": 1.8357622793996782e+05, - "cpu_time": 4.2621766850249324e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.2847751296925003e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8356413358485157e+05, - "cpu_time": 4.2687636590610928e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.2849256883622761e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time_median", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8357034682521780e+05, - "cpu_time": 4.2637528901127528e+05, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.2848483279238491e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0755647402230917e+01, - "cpu_time": 1.2455379122251538e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5836292529076226e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1307027683943895e-04, - "cpu_time": 2.9177954361125432e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1307279121009151e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1994, - "real_time": 3.5091578963804903e+05, - "cpu_time": 8.7652850601805793e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.3904903249444553e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1994, - "real_time": 3.5093890028338274e+05, - "cpu_time": 8.8224933299899776e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.3903329021736290e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1994, - "real_time": 3.5096906344072352e+05, - "cpu_time": 8.8196532998996566e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.3901274709976772e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1994, - "real_time": 3.5094931681286416e+05, - "cpu_time": 8.7911928686057520e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.3902619546836266e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1994, - "real_time": 3.5095378146306012e+05, - "cpu_time": 8.8155828786358540e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.3902315470229374e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5094537032761594e+05, - "cpu_time": 8.8028414874623646e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.3902888399644653e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time_median", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5094931681286410e+05, - "cpu_time": 8.8155828786358540e+05, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.3902619546836266e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9777286282482969e+01, - "cpu_time": 2.4379040960243474e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3470608042104114e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.6354315955273612e-05, - "cpu_time": 2.7694513180733567e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6355565975467513e-05, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1024, - "real_time": 6.8427680560034793e+05, - "cpu_time": 1.7584346923828071e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4518171393052799e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1024, - "real_time": 6.8385319087838067e+05, - "cpu_time": 1.7629425781249958e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4533359241111927e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1024, - "real_time": 6.8385708868845541e+05, - "cpu_time": 1.7627120683593734e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4533219407254242e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1024, - "real_time": 6.8426568236645835e+05, - "cpu_time": 1.7520782431640625e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4518569953673294e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1024, - "real_time": 6.8402767544739624e+05, - "cpu_time": 1.7477040839843778e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4527101171786167e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8405608859620779e+05, - "cpu_time": 1.7567743332031232e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4526084233375687e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time_median", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8402767544739624e+05, - "cpu_time": 1.7584346923828069e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4527101171786167e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0869912424074286e+02, - "cpu_time": 6.7153447296735594e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4824469310192904e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0509066101440125e-04, - "cpu_time": 3.8225426013764013e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0508118865697265e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 518, - "real_time": 1.3490489445371430e+06, - "cpu_time": 3.1198733146718070e+06, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4872657241885677e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 518, - "real_time": 1.3496332791090931e+06, - "cpu_time": 3.4872047451737332e+06, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4861888425091019e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 518, - "real_time": 1.3491453654150763e+06, - "cpu_time": 3.1481712200772227e+06, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4870879639924263e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 518, - "real_time": 1.3491554117427140e+06, - "cpu_time": 3.4759415617760862e+06, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4870694441834164e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 518, - "real_time": 1.3492518674553477e+06, - "cpu_time": 3.4907580096525331e+06, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4868916478346439e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3492469736518748e+06, - "cpu_time": 3.3443897702702763e+06, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4869007245416317e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time_median", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3491554117427138e+06, - "cpu_time": 3.4759415617760858e+06, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4870694441834164e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2758471068356818e+02, - "cpu_time": 1.9237659075319106e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1940674816125692e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6867535382909690e-04, - "cpu_time": 5.7522180118869386e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6864635730023323e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 261, - "real_time": 2.6826534341749558e+06, - "cpu_time": 6.9875153448275356e+06, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5015853015184265e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 261, - "real_time": 2.6829316739306939e+06, - "cpu_time": 7.0195267088122601e+06, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5013258687158642e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 261, - "real_time": 2.6821377874491201e+06, - "cpu_time": 6.6247493754790155e+06, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5020662366427010e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 261, - "real_time": 2.6829359014572082e+06, - "cpu_time": 6.9878346436781352e+06, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5013219273539307e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 261, - "real_time": 2.6824712276929752e+06, - "cpu_time": 7.0353696704980666e+06, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5017552213492374e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6826260049409908e+06, - "cpu_time": 6.9309991486590030e+06, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5016109111160324e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time_median", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6826534341749558e+06, - "cpu_time": 6.9878346436781362e+06, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5015853015184265e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3635325544601767e+02, - "cpu_time": 1.7244101327110577e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1367316044570981e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2538209009623627e-04, - "cpu_time": 2.4879676013878801e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2538846830731650e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 131, - "real_time": 5.3476227433171887e+06, - "cpu_time": 1.3999707854961684e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.5098578273444786e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 131, - "real_time": 5.3501096340820538e+06, - "cpu_time": 1.3503937290076287e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.5086911704572659e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 131, - "real_time": 5.3470122222681995e+06, - "cpu_time": 1.3384541061068531e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.5101444025326153e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 131, - "real_time": 5.3500597336763190e+06, - "cpu_time": 1.4046235312977055e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.5087145692067188e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 131, - "real_time": 5.3472480885968860e+06, - "cpu_time": 1.3952985511450442e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.5100336804312855e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3484104843881298e+06, - "cpu_time": 1.3777481406106800e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.5094883299944729e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time_median", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3476227433171896e+06, - "cpu_time": 1.3952985511450443e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.5098578273444786e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5438563569808107e+03, - "cpu_time": 3.0888648651025502e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2431616861367933e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8865704333788265e-04, - "cpu_time": 2.2419662738455422e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8863101691143332e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 66, - "real_time": 1.0676541506792560e+07, - "cpu_time": 2.7974617409090761e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.5142547877439312e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 66, - "real_time": 1.0677353634188572e+07, - "cpu_time": 2.6962332712120984e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.5140635516695595e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 66, - "real_time": 1.0677305445300810e+07, - "cpu_time": 2.7131394393939335e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.5140748981583282e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 66, - "real_time": 1.0676828114259424e+07, - "cpu_time": 2.7009475348484877e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.5141872953961990e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 66, - "real_time": 1.0677754173450397e+07, - "cpu_time": 2.7965025484848835e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.5139692452130882e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0677156574798353e+07, - "cpu_time": 2.7408569069696955e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.5141099556362213e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time_median", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0677305445300812e+07, - "cpu_time": 2.7131394393939335e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.5140748981583282e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7547712676981666e+02, - "cpu_time": 5.1606272644630505e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1195931786859010e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.4532186396151680e-05, - "cpu_time": 1.8828517648404580e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4532387144641669e-05, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 33, - "real_time": 2.1335824533845440e+07, - "cpu_time": 5.6062930121211961e+07, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.5162885603429626e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 33, - "real_time": 2.1336251248915989e+07, - "cpu_time": 5.4425615606060192e+07, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.5162382357457302e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 33, - "real_time": 2.1335674449801445e+07, - "cpu_time": 5.6017643969697289e+07, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.5163062609675140e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 33, - "real_time": 2.1335824816064402e+07, - "cpu_time": 5.6141968303029791e+07, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.5162885270588337e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 33, - "real_time": 2.1335567996808976e+07, - "cpu_time": 5.4153427060606077e+07, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.5163188159804150e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1335828609087251e+07, - "cpu_time": 5.5360317012121066e+07, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.5162880800190914e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time_median", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1335824533845440e+07, - "cpu_time": 5.6017643969697297e+07, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.5162885603429626e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5997057369630966e+02, - "cpu_time": 9.8323099070837663e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0659914572614193e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2184695446305951e-05, - "cpu_time": 1.7760573706489063e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2184580460430258e-05, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 16, - "real_time": 4.2654158081859350e+07, - "cpu_time": 1.1257115531249973e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.5173204027127621e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 16, - "real_time": 4.2658088263124228e+07, - "cpu_time": 1.1246058049999875e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.5170884765790028e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 16, - "real_time": 4.2654907796531916e+07, - "cpu_time": 1.1248270693750051e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.5172761575803974e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 16, - "real_time": 4.2654314544051886e+07, - "cpu_time": 1.1186942206250094e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.5173111688175812e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 16, - "real_time": 4.2655004421249032e+07, - "cpu_time": 1.1271927299999973e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.5172704552929420e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2655294621363282e+07, - "cpu_time": 1.1242062756249993e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.5172533321965370e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time_median", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2654907796531916e+07, - "cpu_time": 1.1248270693750051e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.5172761575803974e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6039449389435651e+03, - "cpu_time": 3.2447083462921774e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4650820142247051e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_GPUToPinned/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.7602481782888741e-05, - "cpu_time": 2.8862215205908638e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7600832197391686e-05, - "hip_id": NaN, - "numa_id": NaN - } - ] -} diff --git a/results/hipMemcpyAsync_PageableToGPU.json b/results/hipMemcpyAsync_PageableToGPU.json deleted file mode 100644 index 5da718f..0000000 --- a/results/hipMemcpyAsync_PageableToGPU.json +++ /dev/null @@ -1,15326 +0,0 @@ -{ - "context": { - "date": "2023-10-09T16:05:43-04:00", - "host_name": "frontier10341", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1827, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [0.38,0.35,3.05], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 101391, - "real_time": 6.8832135380240470e+03, - "cpu_time": 7.2836224173479617e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7191930569320895e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 101391, - "real_time": 6.8831901123572707e+03, - "cpu_time": 7.2776635869976056e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7192057145190232e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 101391, - "real_time": 6.8815539094073747e+03, - "cpu_time": 7.2929069942424619e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7200900170241661e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 101391, - "real_time": 6.8839979062861476e+03, - "cpu_time": 7.2996353076306963e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7187692890817516e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 101391, - "real_time": 6.8807073345413510e+03, - "cpu_time": 7.2980100856532168e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7205477221051469e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8825325601232398e+03, - "cpu_time": 7.2903676783743882e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7195611599324360e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8831901123572707e+03, - "cpu_time": 7.2929069942424631e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7192057145190232e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3539341607010642e+00, - "cpu_time": 9.4556325833544414e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3176079382199750e+03, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9672034223937193e-04, - "cpu_time": 1.2970035258170771e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9673309897538815e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 101632, - "real_time": 6.8833271613560100e+03, - "cpu_time": 7.2831583630834901e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4382633281538859e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 101632, - "real_time": 6.8800538991193253e+03, - "cpu_time": 7.2689925844951665e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4418021647408620e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 101632, - "real_time": 6.8776049510008643e+03, - "cpu_time": 7.2875970072851241e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4444520097870871e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 101632, - "real_time": 6.8815903366087359e+03, - "cpu_time": 7.2941785835706663e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4401406499927580e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 101632, - "real_time": 6.8833082273653345e+03, - "cpu_time": 7.3055121075360525e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4382837886655822e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8811769150900536e+03, - "cpu_time": 7.2878877291941011e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4405883882680342e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8815903366087350e+03, - "cpu_time": 7.2875970072851253e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4401406499927580e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4164571536953048e+00, - "cpu_time": 1.3506215948210873e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6133492925745690e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.5116916532056358e-04, - "cpu_time": 1.8532414946661642e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5122884860761466e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 100747, - "real_time": 6.9217955489801152e+03, - "cpu_time": 7.2625362894242978e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4793849265757066e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 100747, - "real_time": 6.9471354139926707e+03, - "cpu_time": 7.2736093697190452e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4739888298959827e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 100747, - "real_time": 6.9219968121989623e+03, - "cpu_time": 7.2513956090677404e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4793419121421096e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 100747, - "real_time": 6.9462243846049150e+03, - "cpu_time": 7.2690350772906268e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4741821503340954e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 100747, - "real_time": 6.9246305006402572e+03, - "cpu_time": 7.2694550711015558e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4787792646919137e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9323565320833850e+03, - "cpu_time": 7.2652062833206534e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4771354167279616e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9246305006402572e+03, - "cpu_time": 7.2690350772906268e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4787792646919137e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3127094176459869e+01, - "cpu_time": 8.6773744969125628e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7952613376033376e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8935976699563626e-03, - "cpu_time": 1.1943741386715948e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8923527971424507e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 99696, - "real_time": 7.0134417029681144e+03, - "cpu_time": 7.2563256637428439e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9201069699250209e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 99696, - "real_time": 7.0167152805706191e+03, - "cpu_time": 7.2431951106793475e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9187446235291034e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 99696, - "real_time": 7.0146015609048018e+03, - "cpu_time": 7.2556992092616868e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9196241329148734e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 99696, - "real_time": 7.0156757197062589e+03, - "cpu_time": 7.2345733066593945e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9191771139697832e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 99696, - "real_time": 7.0102073833546483e+03, - "cpu_time": 7.2424339343158472e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9214542281058091e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0141283295008889e+03, - "cpu_time": 7.2464454449318242e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9198214136889184e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0146015609048000e+03, - "cpu_time": 7.2431951106793475e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9196241329148734e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5077856203292166e+00, - "cpu_time": 9.3655677273045364e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0441676302203588e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.5753346709977655e-04, - "cpu_time": 1.2924361051879349e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5761352571942124e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 96318, - "real_time": 7.2715229882754275e+03, - "cpu_time": 7.1284072239173138e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6329327523331392e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 96318, - "real_time": 7.2637745524600678e+03, - "cpu_time": 7.1014859489183414e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6389415315936291e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 96318, - "real_time": 7.2708004800537037e+03, - "cpu_time": 7.1409159461823308e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6334925036613667e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 96318, - "real_time": 7.2724851450131036e+03, - "cpu_time": 7.1015756229565668e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6321875099445391e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 96318, - "real_time": 7.2729789290610734e+03, - "cpu_time": 7.1440497530179262e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6318051240783477e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2703124189726750e+03, - "cpu_time": 7.1232868989984965e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6338718843222046e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2715229882754284e+03, - "cpu_time": 7.1284072239173138e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6329327523331392e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7509463699712158e+00, - "cpu_time": 2.0704818706262945e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9084289986176387e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.1592643531833801e-04, - "cpu_time": 2.9066383257950702e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1623981842951398e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 76950, - "real_time": 9.1016529673389869e+03, - "cpu_time": 6.4125409891139269e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.0005628970877600e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 76950, - "real_time": 9.0394521733708898e+03, - "cpu_time": 6.3790720360982823e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.0624960925537276e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 76950, - "real_time": 9.0727790614569039e+03, - "cpu_time": 6.4149996028094625e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.0292069767259729e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 76950, - "real_time": 9.0905429992215850e+03, - "cpu_time": 6.3946022714386475e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.0115628964094603e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 76950, - "real_time": 9.1010498345801061e+03, - "cpu_time": 6.4221199957488120e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.0011593705089879e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0810954071936958e+03, - "cpu_time": 6.4046669790418267e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.0209976466571808e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0905429992215832e+03, - "cpu_time": 6.4125409891139269e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.0115628964094603e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6045009004561770e+01, - "cpu_time": 1.7534041063583076e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5930989254712206e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8680470622442652e-03, - "cpu_time": 2.7376975447685600e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8745145792517957e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 71214, - "real_time": 9.8288677364313953e+03, - "cpu_time": 6.1999552916587448e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6669264903495996e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 71214, - "real_time": 9.8260664630183692e+03, - "cpu_time": 6.1690916029448724e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6674017076582203e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 71214, - "real_time": 9.8312995963441426e+03, - "cpu_time": 6.2225834676590300e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6665141611687369e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 71214, - "real_time": 9.8282672740485523e+03, - "cpu_time": 6.1799529594162047e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6670283319687283e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 71214, - "real_time": 9.8287645411260382e+03, - "cpu_time": 6.1849234735099447e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6669439919376640e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8286531221937003e+03, - "cpu_time": 6.1913013590377593e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6669629366165900e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8287645411260364e+03, - "cpu_time": 6.1849234735099435e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6669439919376640e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8642681808305432e+00, - "cpu_time": 2.0713508473029789e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1618159744045825e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8967687206509627e-04, - "cpu_time": 3.3455823375150716e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8967524141970868e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 65436, - "real_time": 1.0702317257733945e+04, - "cpu_time": 6.0085641069241750e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0617668315074916e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 65436, - "real_time": 1.0697540117576669e+04, - "cpu_time": 5.9920447637640011e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0631341074533858e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 65436, - "real_time": 1.0695315493146962e+04, - "cpu_time": 6.0088095880269742e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0637712390060997e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 65436, - "real_time": 1.0696274031581914e+04, - "cpu_time": 5.9857337200108433e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0634966814844975e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 65436, - "real_time": 1.0701570458494207e+04, - "cpu_time": 6.0015443958464932e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0619804940863523e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0698603471706740e+04, - "cpu_time": 5.9993393149144971e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0628298707075653e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0697540117576671e+04, - "cpu_time": 6.0015443958464932e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.0631341074533858e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1608160965725620e+00, - "cpu_time": 1.0222132012184173e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0482924939460261e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9544193360671588e-04, - "cpu_time": 1.7038762896393798e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9542262795862438e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 56001, - "real_time": 1.2474600264486029e+04, - "cpu_time": 5.7444350403202879e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2535551128299170e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 56001, - "real_time": 1.2479256499438323e+04, - "cpu_time": 5.7487078433301461e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2515949169687872e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 56001, - "real_time": 1.2463638488247168e+04, - "cpu_time": 5.7350523399519670e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2581756171601467e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 56001, - "real_time": 1.2461678599760717e+04, - "cpu_time": 5.7427741474294806e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2590025874410210e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 56001, - "real_time": 1.2480424912036558e+04, - "cpu_time": 5.7535397741248631e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2511032646648741e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2471919752793758e+04, - "cpu_time": 5.7449018290313482e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2546862998129501e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2474600264486025e+04, - "cpu_time": 5.7444350403202879e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.2535551128299170e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7580147004177213e+00, - "cpu_time": 6.9075537654859177e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6905300142716630e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.0221865390497661e-04, - "cpu_time": 1.2023797744600633e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0233117710624020e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 44954, - "real_time": 1.5570322001624018e+04, - "cpu_time": 5.4155702783158743e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4180661123340225e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 44954, - "real_time": 1.5567311346595274e+04, - "cpu_time": 5.3988865154220462e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4196941322604656e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 44954, - "real_time": 1.5574241228749710e+04, - "cpu_time": 5.4524614054208958e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4159477225795088e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 44954, - "real_time": 1.5566706794679476e+04, - "cpu_time": 5.4032071859205699e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4200211212816648e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 44954, - "real_time": 1.5570461523521220e+04, - "cpu_time": 5.4167785188102865e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4179906807514076e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5569808579033943e+04, - "cpu_time": 5.4173807807779348e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4183439538414145e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5570322001624018e+04, - "cpu_time": 5.4155702783158755e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.4180661123340225e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0081372411736669e+00, - "cpu_time": 2.1078540664433767e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6263297952383459e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9320322571109687e-04, - "cpu_time": 3.8909099281381671e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9318880342210628e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 35495, - "real_time": 1.9723436549717331e+04, - "cpu_time": 5.3878092180714750e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3290990104042339e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 35495, - "real_time": 1.9720745215069102e+04, - "cpu_time": 5.3728590838341129e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3292803955485891e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 35495, - "real_time": 1.9725746003490709e+04, - "cpu_time": 5.3804046056245291e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3289434019560549e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 35495, - "real_time": 1.9719958163029311e+04, - "cpu_time": 5.3721997128953385e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3293334490509405e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 35495, - "real_time": 1.9721247229598866e+04, - "cpu_time": 5.3825436642507362e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3292465580298494e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9722226632181068e+04, - "cpu_time": 5.3791632569352400e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3291805629979336e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9721247229598870e+04, - "cpu_time": 5.3804046056245291e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3292465580298494e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3531709151382918e+00, - "cpu_time": 6.6323881111275242e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5858137817537088e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1931568169379953e-04, - "cpu_time": 1.2329776573664181e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1930762651064844e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 22745, - "real_time": 3.0776497849898456e+04, - "cpu_time": 5.1923099526234138e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7035336592130474e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 22745, - "real_time": 3.0770789758224681e+04, - "cpu_time": 5.1855789041886455e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7038496708062679e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 22745, - "real_time": 3.0771133711646755e+04, - "cpu_time": 5.1980252169316763e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7038306255240736e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 22745, - "real_time": 3.0774971735143052e+04, - "cpu_time": 5.1919315263507980e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7036181365563906e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 22745, - "real_time": 3.0774256068737206e+04, - "cpu_time": 5.1910043651659685e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7036577548095827e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0773529824730031e+04, - "cpu_time": 5.1917699930521011e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7036979693818726e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0774256068737206e+04, - "cpu_time": 5.1919315263507986e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7036577548095827e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4831950638948475e+00, - "cpu_time": 4.4260942850547965e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3747663008962651e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.0692565267547484e-05, - "cpu_time": 8.5252125787121306e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0693076214386237e-05, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 13294, - "real_time": 5.2697902649681113e+04, - "cpu_time": 5.2249273284225696e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9897869692663097e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 13294, - "real_time": 5.2695674484535877e+04, - "cpu_time": 5.2312670451031107e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9898711047103420e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 13294, - "real_time": 5.2714376618794471e+04, - "cpu_time": 5.2262932515811300e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9891651334185501e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 13294, - "real_time": 5.2694081461670190e+04, - "cpu_time": 5.2271069954378331e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9899312615644260e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 13294, - "real_time": 5.2692677383010727e+04, - "cpu_time": 5.2321397542297572e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9899842863898273e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2698942519538476e+04, - "cpu_time": 5.2283468749548799e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9897477510698910e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2695674484535877e+04, - "cpu_time": 5.2271069954378337e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9898711047103420e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8438484129024015e+00, - "cpu_time": 3.1765270171865739e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3384973397742882e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6781832784639817e-04, - "cpu_time": 6.0755858269522086e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6778495354394406e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7654, - "real_time": 9.1562330388719362e+04, - "cpu_time": 5.0718666077462524e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2904091574523453e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7654, - "real_time": 9.1422632890395413e+04, - "cpu_time": 5.0712631572040826e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2939089957234436e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7654, - "real_time": 9.1577222157901051e+04, - "cpu_time": 5.0736712377176052e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2900367040878441e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7654, - "real_time": 9.1496049839896659e+04, - "cpu_time": 5.0725626994054937e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2920683501306099e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7654, - "real_time": 9.1446112857155429e+04, - "cpu_time": 5.0698742236060029e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2933200050568394e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1500869626813583e+04, - "cpu_time": 5.0718475851358873e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2919486424902161e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1496049839896645e+04, - "cpu_time": 5.0718666077462518e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2920683501306099e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8464690435449569e+01, - "cpu_time": 1.4206662846229406e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7148959627844483e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.4824087153141708e-04, - "cpu_time": 2.8010823684578007e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4822617356783507e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4017, - "real_time": 1.7425761721233142e+05, - "cpu_time": 4.9151879122554475e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4069559007508270e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4017, - "real_time": 1.7444207502565192e+05, - "cpu_time": 4.9140932142121673e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4044107474548340e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4017, - "real_time": 1.7432378120987589e+05, - "cpu_time": 4.9106986333258677e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4060423488349518e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4017, - "real_time": 1.7442885363438091e+05, - "cpu_time": 4.9179079442742801e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4045929974358780e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4017, - "real_time": 1.7429346882058054e+05, - "cpu_time": 4.9139473601418501e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4064607976318714e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7434915918056414e+05, - "cpu_time": 4.9143670128419226e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4056925584216724e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time_median", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7432378120987589e+05, - "cpu_time": 4.9140932142121679e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4060423488349518e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2325496931373124e+01, - "cpu_time": 2.5942317566836681e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1358534651631786e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.7218751910419588e-04, - "cpu_time": 5.2788726399647832e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7215237923352505e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2061, - "real_time": 3.3944288959156419e+05, - "cpu_time": 4.8628747069918007e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4712869991454590e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2061, - "real_time": 3.3943976909891475e+05, - "cpu_time": 4.8681254121008945e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4713097178532166e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2061, - "real_time": 3.3959667002357455e+05, - "cpu_time": 4.8615527415477914e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4701679199085396e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2061, - "real_time": 3.3943201619716006e+05, - "cpu_time": 4.8622901869529355e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4713661645657650e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2061, - "real_time": 3.3948861067836283e+05, - "cpu_time": 4.8714117211790258e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4709541752337334e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3947999111791526e+05, - "cpu_time": 4.8652509537544888e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4710169953413429e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time_median", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3944288959156419e+05, - "cpu_time": 4.8628747069918013e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4712869991454590e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8891565127864197e+01, - "cpu_time": 4.3100762258374848e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0134397446862767e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0293262321883162e-04, - "cpu_time": 8.8588980646752053e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0288973139959027e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1042, - "real_time": 6.7178899960345705e+05, - "cpu_time": 4.8210122745105827e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4973936771669735e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1042, - "real_time": 6.7177456438285788e+05, - "cpu_time": 4.8289281563147855e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4974473416409863e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1042, - "real_time": 6.7149712427049130e+05, - "cpu_time": 4.8237056245585269e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4984792032023403e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1042, - "real_time": 6.7183692567988927e+05, - "cpu_time": 4.8208986555662155e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4972155233982857e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1042, - "real_time": 6.7160889024143736e+05, - "cpu_time": 4.8249874631189430e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4980634181255016e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7170130083562655e+05, - "cpu_time": 4.8239064348138106e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4977198327068176e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time_median", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7177456438285788e+05, - "cpu_time": 4.8237056245585263e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.4974473416409863e+10, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4289900870814608e+02, - "cpu_time": 3.3109490197259450e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3142524920669701e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1274189662931023e-04, - "cpu_time": 6.8636261181001502e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1276415482948032e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 70, - "real_time": 9.7514665419501923e+06, - "cpu_time": 6.9276807379999685e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4409626342510595e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 70, - "real_time": 9.7755970300308298e+06, - "cpu_time": 6.9318396921427894e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4324688197477980e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 70, - "real_time": 9.7856407585952971e+06, - "cpu_time": 6.9412097684285903e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4289458225336132e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 70, - "real_time": 9.7389092269752715e+06, - "cpu_time": 6.9264137014285922e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4453993992529902e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 70, - "real_time": 9.7605185583233833e+06, - "cpu_time": 6.9299511062856972e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4377714462092910e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7624264231749941e+06, - "cpu_time": 6.9314190012571263e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4371096243989506e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time_median", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7605185583233833e+06, - "cpu_time": 6.9299511062856972e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4377714462092910e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8635904296332563e+04, - "cpu_time": 5.8570141043280135e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5610362912210748e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9089418438117849e-03, - "cpu_time": 8.4499495749221730e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9088818828024454e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 37, - "real_time": 1.9139317392900184e+07, - "cpu_time": 7.4161301632431936e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5063352899353838e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 37, - "real_time": 1.9085670343121968e+07, - "cpu_time": 7.4130449381080580e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5161910896247077e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 37, - "real_time": 1.9182415074996047e+07, - "cpu_time": 7.4208961432432485e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.4984575058786664e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 37, - "real_time": 1.9188439574193310e+07, - "cpu_time": 7.4277342489189029e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.4973591125281110e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 37, - "real_time": 1.9252271164913435e+07, - "cpu_time": 7.4416517748648024e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.4857634938314948e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9169622710024990e+07, - "cpu_time": 7.4238914536756420e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5008212983596725e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time_median", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9182415074996047e+07, - "cpu_time": 7.4208961432432485e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.4984575058786664e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.1876688317856038e+04, - "cpu_time": 1.1369394197703972e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1302060757649465e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2278511295632788e-03, - "cpu_time": 1.5314601875105369e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2284026502424163e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19, - "real_time": 3.7719552454195522e+07, - "cpu_time": 7.9518064710525715e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5583064821086187e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19, - "real_time": 3.7875746229761526e+07, - "cpu_time": 7.9823271278948033e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5436325712451863e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19, - "real_time": 3.7632276353083156e+07, - "cpu_time": 7.9496637047368777e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5665588427526450e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19, - "real_time": 3.7486869253610313e+07, - "cpu_time": 7.9333624152631378e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5803930995670881e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19, - "real_time": 3.7652436251703061e+07, - "cpu_time": 7.9477399468420112e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5646492328615041e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7673376108470716e+07, - "cpu_time": 7.9529799331578803e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5627080457070084e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time_median", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7652436251703061e+07, - "cpu_time": 7.9496637047368777e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5646492328615041e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4141993786207883e+05, - "cpu_time": 1.7929979699535605e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3366052741479063e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.7538429647212086e-03, - "cpu_time": 2.2544982950077896e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7516553615963254e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 7.3759940266609192e+07, - "cpu_time": 9.1436034199998915e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6393122747893491e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 7.4049559980630875e+07, - "cpu_time": 9.1490360210001719e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6250783403738604e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 7.3754198104143143e+07, - "cpu_time": 9.1294294910001397e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6395956148958607e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 7.4159944802522659e+07, - "cpu_time": 9.1635879339998782e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6196825215391579e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 7.4050534516572952e+07, - "cpu_time": 9.1483502580001068e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6250306328298349e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3954835534095764e+07, - "cpu_time": 9.1468014248000371e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6297398768856125e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time_median", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4049559980630875e+07, - "cpu_time": 9.1483502580001068e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6250783403738604e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8603788028236612e+05, - "cpu_time": 1.2259593327879980e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1354210650894474e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5155607329637847e-03, - "cpu_time": 1.3403148006077975e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5168252753494328e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4423488080501556e+08, - "cpu_time": 1.0929790742000136e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7221988814603786e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4405136108398438e+08, - "cpu_time": 1.0915879555999992e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7269409185727525e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4433465003967285e+08, - "cpu_time": 1.0923560807999933e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7196259654381800e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4400748908519745e+08, - "cpu_time": 1.0920196993999979e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7280763341577144e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4442668557167053e+08, - "cpu_time": 1.0933128597999997e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7172556434079652e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4421101331710818e+08, - "cpu_time": 1.0924511339600010e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7228195486073985e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time_median", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4423488080501556e+08, - "cpu_time": 1.0923560807999933e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7221988814603786e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7977845118309054e+05, - "cpu_time": 7.0027496083199920e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6411401330276597e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2466346851593955e-03, - "cpu_time": 6.4101261746471775e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2466734077303798e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8553931415081024e+08, - "cpu_time": 1.3159162894999809e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7603992542788463e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8564266860485077e+08, - "cpu_time": 1.3177685255000000e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7590386241818137e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8561739623546600e+08, - "cpu_time": 1.3165796574999859e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7593712363192186e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8537715971469879e+08, - "cpu_time": 1.3160098759999955e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7625359544311676e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8524251282215118e+08, - "cpu_time": 1.3169921995000067e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7643120353152914e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8548381030559540e+08, - "cpu_time": 1.3166533095999939e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7611314209052677e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time_median", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8553931415081024e+08, - "cpu_time": 1.3165796574999859e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7603992542788463e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7011809196020965e+05, - "cpu_time": 7.6177144269919046e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2418261704601450e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.9589400806338961e-04, - "cpu_time": 5.7856645872148428e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9605100688573103e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 101143, - "real_time": 6.9204708956761615e+03, - "cpu_time": 7.2349408145925009e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6991702423016645e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 101143, - "real_time": 6.9217920008940910e+03, - "cpu_time": 7.2129039708989239e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6984642122579291e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 101143, - "real_time": 6.9186296516765087e+03, - "cpu_time": 7.2209746831171882e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7001546966452613e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 101143, - "real_time": 6.9147871474079548e+03, - "cpu_time": 7.1969517861334836e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7022108496277139e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 101143, - "real_time": 6.9160527396295383e+03, - "cpu_time": 7.2123636443281245e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7015333693611011e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9183464870568514e+03, - "cpu_time": 7.2156269798140442e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7003066740387343e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time_median", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9186296516765096e+03, - "cpu_time": 7.2129039708989239e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7001546966452613e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9323640537742919e+00, - "cpu_time": 1.3860457600646871e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5684311986823011e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2385330935076589e-04, - "cpu_time": 1.9208944197672583e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2386519195459609e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 100881, - "real_time": 6.9579157771106211e+03, - "cpu_time": 7.2127755140597880e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3585254033157572e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 100881, - "real_time": 6.9595788241537539e+03, - "cpu_time": 7.2116004817977941e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3567670247955889e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 100881, - "real_time": 6.9648597435455631e+03, - "cpu_time": 7.2157170089635587e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3511889521462053e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 100881, - "real_time": 6.9603731612709043e+03, - "cpu_time": 7.2036792129909480e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3559274501097754e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 100881, - "real_time": 6.9657687705762382e+03, - "cpu_time": 7.2105027768201864e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3502296281024158e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9616992553314176e+03, - "cpu_time": 7.2108549989264536e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3545276916939482e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time_median", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9603731612709043e+03, - "cpu_time": 7.2116004817977941e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3559274501097754e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4321677299940951e+00, - "cpu_time": 4.4581170076738374e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6254712469553524e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.9300718174024379e-04, - "cpu_time": 6.1825081884707964e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9295772603451954e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 100549, - "real_time": 6.9635280794324835e+03, - "cpu_time": 7.1909079957484055e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4705189500484565e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 100549, - "real_time": 6.9648359984010194e+03, - "cpu_time": 7.1901996859192717e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4702428028959891e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 100549, - "real_time": 6.9632338986138257e+03, - "cpu_time": 7.1937162898894727e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4705810761345360e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 100549, - "real_time": 6.9618127468403418e+03, - "cpu_time": 7.1920003510952306e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4708812736521077e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 100549, - "real_time": 6.9627264921763935e+03, - "cpu_time": 7.1921577666730428e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4706882442540410e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9632274430928137e+03, - "cpu_time": 7.1917964178650856e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4705824693970260e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time_median", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9632338986138257e+03, - "cpu_time": 7.1920003510952306e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4705810761345360e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1102017069198984e+00, - "cpu_time": 1.3413535166889665e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3445803782340241e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5943780610256600e-04, - "cpu_time": 1.8651160833153184e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5943209082285321e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 99359, - "real_time": 7.0477241125739592e+03, - "cpu_time": 7.1408127620180762e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9059026251412565e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 99359, - "real_time": 7.0430845847710807e+03, - "cpu_time": 7.1573318022696364e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9078168455172193e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 99359, - "real_time": 7.0723090647129857e+03, - "cpu_time": 7.1684422714935648e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.8958010478054720e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 99359, - "real_time": 7.0474199799723110e+03, - "cpu_time": 7.1567093057424068e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9060280298607188e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 99359, - "real_time": 7.0489822899090241e+03, - "cpu_time": 7.1539411437604582e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9053839487323099e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0519040063878729e+03, - "cpu_time": 7.1554474570568275e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9041864994113952e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time_median", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0477241125739583e+03, - "cpu_time": 7.1567093057424068e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9059026251412565e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1621779503221726e+01, - "cpu_time": 9.8799228230862343e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7766467914217815e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6480342745298707e-03, - "cpu_time": 1.3807554150009839e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6447451953894444e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 96740, - "real_time": 7.2352855489432613e+03, - "cpu_time": 7.0695011105305302e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6611449158329833e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 96740, - "real_time": 7.2338364171991661e+03, - "cpu_time": 7.0740564616214275e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6622789952249300e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 96740, - "real_time": 7.2360271317770666e+03, - "cpu_time": 7.0633670219350517e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6605647344968975e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 96740, - "real_time": 7.2339251332365347e+03, - "cpu_time": 7.0782466543204284e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6622095536775422e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 96740, - "real_time": 7.2368922468838646e+03, - "cpu_time": 7.0693795467868602e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6598880572854984e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2351932956079791e+03, - "cpu_time": 7.0709101590388608e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6612172513035703e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time_median", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2352855489432604e+03, - "cpu_time": 7.0695011105305302e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6611449158329833e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3266106810598171e+00, - "cpu_time": 5.5890627986559877e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0379946396778742e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8335525076643318e-04, - "cpu_time": 7.9043046410530286e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8335184706767121e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 92134, - "real_time": 7.5976074588125648e+03, - "cpu_time": 6.9129500254365420e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0782341736408074e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 92134, - "real_time": 7.5959314546184842e+03, - "cpu_time": 6.9171474555192578e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0784720806056108e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 92134, - "real_time": 7.5969608578464395e+03, - "cpu_time": 6.9061844238138604e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0783259455047712e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 92134, - "real_time": 7.5947105828994154e+03, - "cpu_time": 6.9179616029489720e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0786454481156225e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 92134, - "real_time": 7.5973310366665191e+03, - "cpu_time": 6.9130378782754207e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0782734042341275e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5965082781686842e+03, - "cpu_time": 6.9134562771988106e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0783902104201877e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time_median", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5969608578464376e+03, - "cpu_time": 6.9130378782754207e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0783259455047712e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1889482467075330e+00, - "cpu_time": 4.6699560405403021e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6879732794093632e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5651246640833736e-04, - "cpu_time": 6.7548789683421161e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5652713304506496e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 86986, - "real_time": 8.0532485548788754e+03, - "cpu_time": 6.7471322680106556e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0344585030936530e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 86986, - "real_time": 8.0504065639193004e+03, - "cpu_time": 6.7466574551020646e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0351767168419294e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 86986, - "real_time": 8.0511955328298600e+03, - "cpu_time": 6.7444104524817586e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0349772817207062e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 86986, - "real_time": 8.0485394708604363e+03, - "cpu_time": 6.7525110358579588e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0356488353344007e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 86986, - "real_time": 8.0520311040854103e+03, - "cpu_time": 6.7470448781629133e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0347661090985036e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0510842453147761e+03, - "cpu_time": 6.7475512179230702e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0350054892178383e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time_median", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0511955328298591e+03, - "cpu_time": 6.7470448781629133e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0349772817207062e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7697663271882376e+00, - "cpu_time": 2.9872609689393186e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4735485118639318e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1981714179902294e-04, - "cpu_time": 4.4271779086381093e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1982980073352807e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 78440, - "real_time": 8.9262184853402341e+03, - "cpu_time": 6.4698229714859200e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6709834129442110e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 78440, - "real_time": 8.9236577547035304e+03, - "cpu_time": 6.4745786115680456e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6720368374424109e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 78440, - "real_time": 8.9270560275090738e+03, - "cpu_time": 6.4794260990862906e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6706389989067078e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 78440, - "real_time": 8.9218562173252831e+03, - "cpu_time": 6.4771163043698585e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6727783100077400e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 78440, - "real_time": 8.9262380279974896e+03, - "cpu_time": 6.4796465745453203e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6709753758774872e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9250053025751222e+03, - "cpu_time": 6.4761181122110868e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6714825870357118e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time_median", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9262184853402359e+03, - "cpu_time": 6.4771163043698585e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6709834129442110e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1754034277287158e+00, - "cpu_time": 4.0739437325036136e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9500982859407749e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4374253616421369e-04, - "cpu_time": 6.2907187020291714e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4377340961780024e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 65526, - "real_time": 1.0648693458428526e+04, - "cpu_time": 6.0661068656453264e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.1543700413432150e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 65526, - "real_time": 1.0682980736342734e+04, - "cpu_time": 6.0785613472948444e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.1346174459578714e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 65526, - "real_time": 1.0662438233960220e+04, - "cpu_time": 6.0785739423940539e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.1464365431225348e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 65526, - "real_time": 1.0694320407530939e+04, - "cpu_time": 6.0839051338497341e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.1281126338658752e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 65526, - "real_time": 1.0675037563208047e+04, - "cpu_time": 6.0755753628460991e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.1391821445080910e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0672694079894094e+04, - "cpu_time": 6.0765445304060102e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.1405437617595177e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time_median", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0675037563208047e+04, - "cpu_time": 6.0785613472948432e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.1391821445080910e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7749770903408109e+01, - "cpu_time": 6.5621771901057579e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0215173035409631e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6631012535856589e-03, - "cpu_time": 1.0799192135052616e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6635616374929255e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 50885, - "real_time": 1.3758592221073284e+04, - "cpu_time": 5.6743157690755975e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.5265560526784267e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 50885, - "real_time": 1.3760460135893978e+04, - "cpu_time": 5.6732773721072388e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.5252628695242844e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 50885, - "real_time": 1.3760500950284200e+04, - "cpu_time": 5.6708452705277777e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.5252346170793247e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 50885, - "real_time": 1.3758101779116194e+04, - "cpu_time": 5.6744688192839468e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.5268956506018753e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 50885, - "real_time": 1.3760365747913616e+04, - "cpu_time": 5.6705912533134544e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.5253282072007065e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3759604166856254e+04, - "cpu_time": 5.6726996968616033e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.5258554794169235e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time_median", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3760365747913616e+04, - "cpu_time": 5.6732773721072376e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.5253282072007065e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1616918772492240e+00, - "cpu_time": 1.8681289736388411e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0427476140930841e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.4427710504018314e-05, - "cpu_time": 3.2931920839602625e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4430712091649118e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 38644, - "real_time": 1.8115547367903488e+04, - "cpu_time": 5.4174193946335387e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4470664047637768e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 38644, - "real_time": 1.8115290019924265e+04, - "cpu_time": 5.4198609333447289e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4470869619624004e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 38644, - "real_time": 1.8115484536232561e+04, - "cpu_time": 5.4167879070473015e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4470714237628532e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 38644, - "real_time": 1.8116374558653708e+04, - "cpu_time": 5.4184240811151934e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4470003319443447e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 38644, - "real_time": 1.8118635430779275e+04, - "cpu_time": 5.4186621481825197e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4468197729431620e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8116266382698661e+04, - "cpu_time": 5.4182308928646576e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4470089790753077e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time_median", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8115547367903488e+04, - "cpu_time": 5.4184240811151946e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4470664047637768e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3879518141771583e+00, - "cpu_time": 1.1854400258260302e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1085137546823674e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.6613568428353181e-05, - "cpu_time": 2.1878728486583187e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.6607247827221412e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 23663, - "real_time": 2.9583180605874262e+04, - "cpu_time": 5.2134538219596314e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7722502762123333e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 23663, - "real_time": 2.9582511895465115e+04, - "cpu_time": 5.2103991006821716e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7722903377936996e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 23663, - "real_time": 2.9585877649282374e+04, - "cpu_time": 5.2130014408988595e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7720887181885475e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 23663, - "real_time": 2.9583964928999125e+04, - "cpu_time": 5.2109957191620547e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7722032907295551e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 23663, - "real_time": 2.9583735322770361e+04, - "cpu_time": 5.2119371985860699e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7722170452101761e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9583854080478246e+04, - "cpu_time": 5.2119574562577569e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7722099336268627e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time_median", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9583735322770361e+04, - "cpu_time": 5.2119371985860693e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7722170452101761e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2625617651858552e+00, - "cpu_time": 1.2925589887665550e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5631066801943234e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2677392937081600e-05, - "cpu_time": 2.4799876046851437e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2676132983389142e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 13477, - "real_time": 5.1997156418423590e+04, - "cpu_time": 5.1867734888223225e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0166025841145214e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 13477, - "real_time": 5.1991302384680239e+04, - "cpu_time": 5.1834393817688650e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0168296463159451e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 13477, - "real_time": 5.1979206158054862e+04, - "cpu_time": 5.1828034993716180e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0172989883907825e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 13477, - "real_time": 5.1992846806156667e+04, - "cpu_time": 5.1842328923609394e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0167697374013268e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 13477, - "real_time": 5.1995388065139261e+04, - "cpu_time": 5.1868297702211833e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0166711683858486e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1991179966490934e+04, - "cpu_time": 5.1848158065089875e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0168344249216854e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time_median", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1992846806156675e+04, - "cpu_time": 5.1842328923609400e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0167697374013268e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0638427761226783e+00, - "cpu_time": 1.8823046916141076e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7405718882306297e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3586617539119956e-04, - "cpu_time": 3.6304176693240938e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3588482298625219e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7644, - "real_time": 9.1370031961040309e+04, - "cpu_time": 5.0084129911420739e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2952295790968033e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7644, - "real_time": 9.1326329539382743e+04, - "cpu_time": 5.0057074669360995e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2963279161412518e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7644, - "real_time": 9.1533554227321409e+04, - "cpu_time": 5.0177175533960849e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2911292123452049e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7644, - "real_time": 9.1374767002720750e+04, - "cpu_time": 5.0108401147462362e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2951106402685062e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7644, - "real_time": 9.1362186967191054e+04, - "cpu_time": 5.0076453024475360e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2954266634982212e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1393373939531259e+04, - "cpu_time": 5.0100646857336062e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2946448022699978e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time_median", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1370031961040309e+04, - "cpu_time": 5.0084129911420739e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2952295790968033e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0636775061739783e+01, - "cpu_time": 4.6565690090472565e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0225306410463106e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.8230439019672941e-04, - "cpu_time": 9.2944289168701854e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8141338434842033e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4011, - "real_time": 1.7452878236293010e+05, - "cpu_time": 4.8791152066392040e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4032162163820091e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4011, - "real_time": 1.7436710999337866e+05, - "cpu_time": 4.8743519580328637e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4054444672273762e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4011, - "real_time": 1.7431509160195559e+05, - "cpu_time": 4.8723751127525508e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4061622900543774e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4011, - "real_time": 1.7438011186297706e+05, - "cpu_time": 4.8742463933583015e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4052651160676884e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4011, - "real_time": 1.7434740606163113e+05, - "cpu_time": 4.8756385381250817e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4057163193568420e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7438770037657447e+05, - "cpu_time": 4.8751454417816001e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4051608818176590e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time_median", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7436710999337866e+05, - "cpu_time": 4.8743519580328637e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4054444672273762e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2585322958717740e+01, - "cpu_time": 2.5057336502423772e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1384571165207760e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.7357309477894487e-04, - "cpu_time": 5.1398131197633924e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7333927851861895e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2066, - "real_time": 3.3900890662086930e+05, - "cpu_time": 4.8528583798450804e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4744506224378944e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2066, - "real_time": 3.3902540712629509e+05, - "cpu_time": 4.8547754719023544e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4743301899125935e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2066, - "real_time": 3.3902052220471913e+05, - "cpu_time": 4.8558859693853092e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4743658423529007e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2066, - "real_time": 3.3898280899352342e+05, - "cpu_time": 4.8540971467474782e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4746411255799911e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2066, - "real_time": 3.3897700091985764e+05, - "cpu_time": 4.8512286911230332e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4746835263856937e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3900292917305289e+05, - "cpu_time": 4.8537691318006504e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4744942613338150e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time_median", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3900890662086924e+05, - "cpu_time": 4.8540971467474782e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4744506224378944e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1952214117791904e+01, - "cpu_time": 1.7947578905784132e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6023855240484420e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.4755234331871574e-05, - "cpu_time": 3.6976581329746809e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4756081640080900e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1046, - "real_time": 6.6937279266912502e+05, - "cpu_time": 4.8207348763289839e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5064084145250103e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1046, - "real_time": 6.6925561769836955e+05, - "cpu_time": 4.8222272186998081e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5068472428663891e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1046, - "real_time": 6.6940430877863802e+05, - "cpu_time": 4.8243354903823316e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5062904107400917e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1046, - "real_time": 6.6917638566405524e+05, - "cpu_time": 4.8246182900573057e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5071440593874481e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1046, - "real_time": 6.6929386085501197e+05, - "cpu_time": 4.8213849450956500e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5067040027182354e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6930059313304001e+05, - "cpu_time": 4.8226601641128159e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5066788260474350e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time_median", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6929386085501197e+05, - "cpu_time": 4.8222272186998081e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5067040027182354e+10, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1467639864189266e+01, - "cpu_time": 1.7436551883484953e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4257443990116953e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3666152518410784e-04, - "cpu_time": 3.6155464598639425e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3666467213166894e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 69, - "real_time": 9.8928793913860247e+06, - "cpu_time": 6.8842938163765788e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.3917761121414938e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 69, - "real_time": 9.9174197547245715e+06, - "cpu_time": 6.8847102818842244e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.3833832619633713e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 69, - "real_time": 9.8771252196984012e+06, - "cpu_time": 6.8786232708694482e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.3971860489407248e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 69, - "real_time": 9.9822014867179636e+06, - "cpu_time": 6.8875750704349780e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.3614260385994596e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 69, - "real_time": 9.8909060538247004e+06, - "cpu_time": 6.8863605234785211e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.3924528063862138e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.9121063812703341e+06, - "cpu_time": 6.8843125926087499e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.3852448536062527e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time_median", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8928793913860247e+06, - "cpu_time": 6.8847102818842256e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.3917761121414938e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1786266984040245e+04, - "cpu_time": 3.4410998798355216e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4212719119886948e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2156798340056683e-03, - "cpu_time": 4.9984654728345897e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1984316451279266e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 36, - "real_time": 1.9502318050298426e+07, - "cpu_time": 7.3062961344446993e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.4410711499484081e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 36, - "real_time": 1.9333397607422538e+07, - "cpu_time": 7.2704660866666400e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.4711365980615511e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 36, - "real_time": 1.9419135836263496e+07, - "cpu_time": 7.2925210374999630e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.4558110394737649e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 36, - "real_time": 1.9341069170170359e+07, - "cpu_time": 7.2758843833332145e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.4697597847125063e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 36, - "real_time": 1.9403540218869846e+07, - "cpu_time": 7.2847800258335674e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.4585886515047894e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9399892176604934e+07, - "cpu_time": 7.2859895335556185e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.4592734447402039e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time_median", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9403540218869846e+07, - "cpu_time": 7.2847800258335686e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.4585886515047894e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8476930546099858e+04, - "cpu_time": 1.4138360554084908e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2190964486418620e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.5297583060115551e-03, - "cpu_time": 1.9404859818931528e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5241401644483697e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 18, - "real_time": 3.8042982005410723e+07, - "cpu_time": 7.6380392733335924e+, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19, - "real_time": 3.6880042011800565e+07, - "cpu_time": 7.8282756673684156e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6393051818393846e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19, - "real_time": 3.6982442791524686e+07, - "cpu_time": 7.8160819778946686e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6292283004831376e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19, - "real_time": 3.6989609661855198e+07, - "cpu_time": 7.8104904242103076e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6285251244056621e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19, - "real_time": 3.6980808761559032e+07, - "cpu_time": 7.8093396678945005e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6293886611673350e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19, - "real_time": 3.7016827220979489e+07, - "cpu_time": 7.8109667784212887e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6258571594685826e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6969946089543790e+07, - "cpu_time": 7.8150309031578362e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6304608854728203e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time_median", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6982442791524686e+07, - "cpu_time": 7.8109667784212887e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6292283004831376e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2300585462489340e+04, - "cpu_time": 7.8430184695151995e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1437333955173064e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/5/log2(N):27/manu, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 7.4983213841915131e+07, - "cpu_time": 9.2329889690000761e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5799406593312263e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 7.4419911950826645e+07, - "cpu_time": 9.2041688409999537e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6070380757420158e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 7.4864832311868668e+07, - "cpu_time": 9.2116240659999561e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5856015128941083e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 7.4355527758598328e+07, - "cpu_time": 9.1933674079997444e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6101613974350233e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 7.4835710227489471e+07, - "cpu_time": 9.2237509470000422e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5869968385947828e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4691839218139663e+07, - "cpu_time": 9.2131800461999547e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5939476967994318e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time_median", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4835710227489471e+07, - "cpu_time": 9.2116240659999561e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5869968385947828e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8397820590058091e+05, - "cpu_time": 1.5654878570232657e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3678563734380888e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8019977667334498e-03, - "cpu_time": 1.6991829630736055e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8059996662061189e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4589905440807343e+08, - "cpu_time": 1.1027682554000421e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6797422312168999e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4585969448089600e+08, - "cpu_time": 1.1021987082000351e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6807352018025570e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4600231945514679e+08, - "cpu_time": 1.1020370651999884e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6771396098603182e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4586667418479919e+08, - "cpu_time": 1.1008088457999749e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6805590790384078e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4548526704311371e+08, - "cpu_time": 1.1005063108000171e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6902081077453804e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4582260191440585e+08, - "cpu_time": 1.1016638370800116e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6816768459327135e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time_median", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4586667418479919e+08, - "cpu_time": 1.1020370651999884e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6805590790384078e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9701295460105615e+05, - "cpu_time": 9.6384689479897427e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9811587471189871e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3510453936125605e-03, - "cpu_time": 8.7490109265424862e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3529592507886346e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8961427509784698e+08, - "cpu_time": 1.3249275459999411e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7074892929129043e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8775908052921295e+08, - "cpu_time": 1.3222702269999900e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7313916281123056e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8892794251441956e+08, - "cpu_time": 1.3254376140000374e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7162962317028670e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8946802020072937e+08, - "cpu_time": 1.3258339365000041e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7093625169903812e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8858387470245361e+08, - "cpu_time": 1.3247280384999840e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7207270333697228e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8887063860893255e+08, - "cpu_time": 1.3246394723999915e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7170533406176362e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time_median", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8892794251441956e+08, - "cpu_time": 1.3249275459999411e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7162962317028670e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4681634858200734e+05, - "cpu_time": 1.3935501978667879e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6212719689986929e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5852968379837067e-03, - "cpu_time": 1.0520222497536961e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5884137480254709e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 99931, - "real_time": 6.9468509649910447e+03, - "cpu_time": 7.2498239925601900e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6851229613262624e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 99931, - "real_time": 6.9526833767164972e+03, - "cpu_time": 7.1933747396647263e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6820316146900341e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 99931, - "real_time": 6.9352506503035056e+03, - "cpu_time": 7.1743148283230615e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6912869182139330e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 99931, - "real_time": 6.9543363953414873e+03, - "cpu_time": 7.1790349418671381e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6811564101427011e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 99931, - "real_time": 6.9527248485636383e+03, - "cpu_time": 7.1787240251248395e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6820096519839555e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9483692471832346e+03, - "cpu_time": 7.1950545055079913e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6843215112713777e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time_median", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9526833767164962e+03, - "cpu_time": 7.1790349418671393e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.6820316146900341e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8675377200578795e+00, - "cpu_time": 3.1448225481560836e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1762842613081310e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1322854960892101e-03, - "cpu_time": 4.3708112923239771e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1335287239541121e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 100903, - "real_time": 6.9363132485674296e+03, - "cpu_time": 7.2682166377887535e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3814428739322633e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 100903, - "real_time": 6.9567752670892860e+03, - "cpu_time": 7.2750670779364729e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3597317771948203e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 100903, - "real_time": 6.9352290564895438e+03, - "cpu_time": 7.2545554379083204e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3825968231129020e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 100903, - "real_time": 6.9602632543805348e+03, - "cpu_time": 7.2804252540530586e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3560436047841415e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 100903, - "real_time": 6.9350225309360894e+03, - "cpu_time": 7.2675468161302674e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3828166774663702e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9447206714925778e+03, - "cpu_time": 7.2691622447633743e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3725263512980983e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time_median", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9363132485674287e+03, - "cpu_time": 7.2682166377887547e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.3814428739322633e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2666043222634503e+01, - "cpu_time": 9.7286307071153575e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3436811846100251e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8238376778244537e-03, - "cpu_time": 1.3383427662690783e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8225518914197437e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 100378, - "real_time": 6.9720638741581715e+03, - "cpu_time": 7.2247429201464593e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4687186154381594e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 100378, - "real_time": 6.9715572781115561e+03, - "cpu_time": 7.2298279535716879e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4688253415273944e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 100378, - "real_time": 6.9712570517114709e+03, - "cpu_time": 7.2294225664568448e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4688885984323359e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 100378, - "real_time": 6.9734606749441691e+03, - "cpu_time": 7.2347207310151958e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4684244276005733e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 100378, - "real_time": 6.9686468529608219e+03, - "cpu_time": 7.2210183991475213e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4694387900642797e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9713971463772377e+03, - "cpu_time": 7.2279465140675426e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4688591546125486e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time_median", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9715572781115570e+03, - "cpu_time": 7.2294225664568448e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4688253415273944e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7544271618776162e+00, - "cpu_time": 5.2409529385646561e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6970473083259298e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5166076828506655e-04, - "cpu_time": 7.2509570019151949e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5169515380125919e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 99409, - "real_time": 7.0296708235049655e+03, - "cpu_time": 7.2028132816668463e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9133654354797733e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 99409, - "real_time": 7.0320981908896156e+03, - "cpu_time": 7.2114789465468276e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9123597885098815e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 99409, - "real_time": 7.0199990163369339e+03, - "cpu_time": 7.1911924232975781e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9173793261706966e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 99409, - "real_time": 7.0454282376389328e+03, - "cpu_time": 7.2003031626352668e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9068495638901389e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 99409, - "real_time": 7.0397093662026546e+03, - "cpu_time": 7.1978693286080098e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9092110106595612e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0333811269146199e+03, - "cpu_time": 7.2007314285509062e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9118330249420100e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time_median", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0320981908896138e+03, - "cpu_time": 7.2003031626352668e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9123597885098815e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7425952529120465e+00, - "cpu_time": 7.4028863366634282e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0341375221972790e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3851937037266590e-03, - "cpu_time": 1.0280742185871533e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3854288647878838e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 97139, - "real_time": 7.1961904921359219e+03, - "cpu_time": 7.1186574698032343e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6919004638303494e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 97139, - "real_time": 7.1970441174233465e+03, - "cpu_time": 7.1036118981330514e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6912253602614176e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 97139, - "real_time": 7.1937777857726460e+03, - "cpu_time": 7.1211958870937479e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6938094586418617e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 97139, - "real_time": 7.1983733907347105e+03, - "cpu_time": 7.1078585640650475e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6901744014447916e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 97139, - "real_time": 7.1943742018921375e+03, - "cpu_time": 7.1149803532088161e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6933374398606372e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1959519975917528e+03, - "cpu_time": 7.1132608344607794e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6920894248078120e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time_median", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1961904921359210e+03, - "cpu_time": 7.1149803532088161e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.6919004638303494e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8927088016525606e+00, - "cpu_time": 7.3710917738651298e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4971377892498739e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6302410053402077e-04, - "cpu_time": 1.0362465183555855e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6302077805118521e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 81349, - "real_time": 8.6277405924061241e+03, - "cpu_time": 6.5511047706587470e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.4949539943404758e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 81349, - "real_time": 8.5961960512181777e+03, - "cpu_time": 6.5435076739246416e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.5297966114198875e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 81349, - "real_time": 8.6271941203081606e+03, - "cpu_time": 6.5492019744015837e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.4955554329260695e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 81349, - "real_time": 8.6079599556731791e+03, - "cpu_time": 6.5410289167983150e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.5167728964642358e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 81349, - "real_time": 8.6288911413170281e+03, - "cpu_time": 6.5496438866788411e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.4936879673622298e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6175963721845346e+03, - "cpu_time": 6.5468974444924259e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.5061533805025816e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time_median", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6271941203081606e+03, - "cpu_time": 6.5492019744015849e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.4955554329260695e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4776908026437146e+01, - "cpu_time": 4.3728011081922951e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6316446880862266e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7147366142760342e-03, - "cpu_time": 6.6791959783498854e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7164089645689716e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 72395, - "real_time": 9.6864911434207625e+03, - "cpu_time": 6.2238167465198445e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6914277582474544e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 72395, - "real_time": 9.6755187503660472e+03, - "cpu_time": 6.2250405423591614e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6933458993483069e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 72395, - "real_time": 9.6844801810678109e+03, - "cpu_time": 6.2182595340294409e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6917789797359574e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 72395, - "real_time": 9.6777723546929992e+03, - "cpu_time": 6.2236428097238469e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6929515801283526e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 72395, - "real_time": 9.6866169030013298e+03, - "cpu_time": 6.2188198871345830e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6914057987493582e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6821758665097896e+03, - "cpu_time": 6.2219159039533758e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6921820032418861e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time_median", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6844801810678091e+03, - "cpu_time": 6.2236428097238469e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.6917789797359574e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1807913774510510e+00, - "cpu_time": 3.1350092642319284e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0563646145680337e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.3508544451988068e-04, - "cpu_time": 5.0386557977100891e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3518856702280428e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 66463, - "real_time": 1.0537148694112646e+04, - "cpu_time": 6.0318896986986029e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.1097596656587238e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 66463, - "real_time": 1.0539309920599095e+04, - "cpu_time": 6.0430031486049366e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.1091219678391757e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 66463, - "real_time": 1.0536645782898398e+04, - "cpu_time": 6.0392536905566216e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.1099080936349220e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 66463, - "real_time": 1.0536977769770885e+04, - "cpu_time": 6.0492933639775312e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.1098101102582569e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 66463, - "real_time": 1.0536134138985959e+04, - "cpu_time": 6.0383528165400147e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.1100591134988837e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0537243261273397e+04, - "cpu_time": 6.0403585436755407e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.1097317901779928e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time_median", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0536977769770885e+04, - "cpu_time": 6.0392536905566227e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.1098101102582569e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2183638740668701e+00, - "cpu_time": 6.3990219180705084e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5951975433903490e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1562453706887603e-04, - "cpu_time": 1.0593778286175576e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1561117761813694e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 57356, - "real_time": 1.2188810258673164e+04, - "cpu_time": 5.7822117046191728e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3767347763385429e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 57356, - "real_time": 1.2198693670569746e+04, - "cpu_time": 5.7876500490762603e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3723785324743795e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 57356, - "real_time": 1.2179646636829375e+04, - "cpu_time": 5.7739753925772643e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3807800795984697e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 57356, - "real_time": 1.2188266183960861e+04, - "cpu_time": 5.7774395020996082e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3769747895924730e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 57356, - "real_time": 1.2185959249634965e+04, - "cpu_time": 5.7654295967588151e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3779927092701511e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2188275199933623e+04, - "cpu_time": 5.7773412490262246e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3769721774548035e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time_median", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2188266183960859e+04, - "cpu_time": 5.7774395020996082e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3769747895924730e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8674344973026447e+00, - "cpu_time": 8.4145528569221613e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0290074384325966e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.6344596627913731e-04, - "cpu_time": 1.4564749586741894e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6332957256743346e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 46077, - "real_time": 1.5191373128868201e+04, - "cpu_time": 5.4892280992139626e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6280548103267612e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 46077, - "real_time": 1.5189789756604110e+04, - "cpu_time": 5.4895713766990983e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6289541922733612e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 46077, - "real_time": 1.5192116185151312e+04, - "cpu_time": 5.4843091450315320e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6276328065545616e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 46077, - "real_time": 1.5189372867480923e+04, - "cpu_time": 5.4940993190373075e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6291910234564934e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 46077, - "real_time": 1.5192991569824446e+04, - "cpu_time": 5.4855521283637083e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6271357025122433e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5191128701585802e+04, - "cpu_time": 5.4885520136691213e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6281937070246849e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time_median", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5191373128868203e+04, - "cpu_time": 5.4892280992139637e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6280548103267612e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5314105898670933e+00, - "cpu_time": 3.8493517518479779e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6980644467605546e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0080953298139258e-04, - "cpu_time": 7.0134194633871526e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0080979567808015e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 35392, - "real_time": 1.9778104666587667e+04, - "cpu_time": 5.3958604618936265e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3254252842682926e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 35392, - "real_time": 1.9777143567107174e+04, - "cpu_time": 5.4072814316786623e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3254896952661608e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 35392, - "real_time": 1.9781900817964033e+04, - "cpu_time": 5.3944250651946270e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3251709348474028e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 35392, - "real_time": 1.9780397640265182e+04, - "cpu_time": 5.4042009810756898e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3252716389602652e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 35392, - "real_time": 1.9779532523415819e+04, - "cpu_time": 5.3918636360826254e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3253296036681517e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9779415843067974e+04, - "cpu_time": 5.3987263151850486e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3253374314020548e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time_median", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9779532523415819e+04, - "cpu_time": 5.3958604618936265e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3253296036681517e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8731699088346030e+00, - "cpu_time": 6.6515452300622850e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2551238075026702e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.4702994451228276e-05, - "cpu_time": 1.2320582377649747e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4702207737005768e-05, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 22717, - "real_time": 3.0815428278965413e+04, - "cpu_time": 5.1999826942006099e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7013815133566668e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 22717, - "real_time": 3.0834276954320099e+04, - "cpu_time": 5.2408304596832561e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7003414763923744e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 22717, - "real_time": 3.0811403137988491e+04, - "cpu_time": 5.1829136498940986e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7016037784841627e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 22717, - "real_time": 3.0819117982746393e+04, - "cpu_time": 5.1951313165844136e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7011778218101974e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 22717, - "real_time": 3.0825437069540509e+04, - "cpu_time": 5.2234109093560517e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7008290874099686e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0821132684712182e+04, - "cpu_time": 5.2084538059436876e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7010667354906738e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time_median", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0819117982746393e+04, - "cpu_time": 5.1999826942006093e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7011778218101974e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9800181050386190e+00, - "cpu_time": 2.3310462660187325e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9555974060853655e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9135912027960164e-04, - "cpu_time": 4.4755053090009787e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9132292711937135e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 13947, - "real_time": 5.0220634011934730e+04, - "cpu_time": 5.3114511841874307e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0879385946238953e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 13947, - "real_time": 5.0234640356590098e+04, - "cpu_time": 5.3125384899404556e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0873564388173054e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 13947, - "real_time": 5.0261956967551137e+04, - "cpu_time": 5.3158193716267276e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0862219922653538e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 13947, - "real_time": 5.0231222910978402e+04, - "cpu_time": 5.3107464896477294e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0874984506316410e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 13947, - "real_time": 5.0182076211573461e+04, - "cpu_time": 5.3085082034607065e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0895428789735237e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0226106091725567e+04, - "cpu_time": 5.3118127477726108e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0877116710623440e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time_median", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0231222910978395e+04, - "cpu_time": 5.3114511841874301e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0874984506316410e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8952006914617005e+01, - "cpu_time": 2.6817617380819388e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2037039223888904e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.7643343606496832e-04, - "cpu_time": 5.0486752177144722e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7656617006714280e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7647, - "real_time": 9.1445739975841730e+04, - "cpu_time": 5.0893247577940094e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2933293563527714e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7647, - "real_time": 9.1477877017632389e+04, - "cpu_time": 5.0884945308251888e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2925236880997723e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7647, - "real_time": 9.1397781555941969e+04, - "cpu_time": 5.0881037285929888e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2945327165478226e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7647, - "real_time": 9.1411468100341765e+04, - "cpu_time": 5.0870168994951719e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2941891685821850e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7647, - "real_time": 9.1418623072681934e+04, - "cpu_time": 5.0904359453495461e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2940096115128201e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1430297944487975e+04, - "cpu_time": 5.0886751724113828e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2937169082190746e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time_median", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1418623072681934e+04, - "cpu_time": 5.0884945308251888e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2940096115128201e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1821398902780594e+01, - "cpu_time": 1.2875685393432202e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.9815709549035523e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.4803997819301652e-04, - "cpu_time": 2.5302627810159031e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4797541607262838e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4022, - "real_time": 1.7408934545908510e+05, - "cpu_time": 4.9270534173992813e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4092824227349148e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4022, - "real_time": 1.7409073495714078e+05, - "cpu_time": 4.9279720368918884e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4092631931461437e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4022, - "real_time": 1.7405532706478654e+05, - "cpu_time": 4.9287974945201325e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4097533070267963e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4022, - "real_time": 1.7412379052986571e+05, - "cpu_time": 4.9298195015417194e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4088058198345924e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4022, - "real_time": 1.7403046825811177e+05, - "cpu_time": 4.9272101109574610e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4100975202682640e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7407793325379799e+05, - "cpu_time": 4.9281705122620964e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4094404526021423e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time_median", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7408934545908507e+05, - "cpu_time": 4.9279720368918884e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4092824227349148e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5919971455466175e+01, - "cpu_time": 1.1534661318083483e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9718429967166102e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0634419759049202e-04, - "cpu_time": 2.3405564578951463e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0634844871750740e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2067, - "real_time": 3.3877316291419673e+05, - "cpu_time": 4.8824139507207346e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4761725302675869e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2067, - "real_time": 3.3884151756153390e+05, - "cpu_time": 4.8800447544267660e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4756730109015114e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2067, - "real_time": 3.3882224057536584e+05, - "cpu_time": 4.8785725500628287e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4758138620873920e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2067, - "real_time": 3.3879220504216838e+05, - "cpu_time": 4.8816656907401931e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4760333547095329e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2067, - "real_time": 3.3885645462730812e+05, - "cpu_time": 4.8813806293419278e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4755638812388050e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3881711614411464e+05, - "cpu_time": 4.8808155150584900e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4758513278409653e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time_median", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3882224057536584e+05, - "cpu_time": 4.8813806293419278e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4758138620873920e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4357148153701409e+01, - "cpu_time": 1.5183966315003525e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5106321473286366e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0140322467973466e-04, - "cpu_time": 3.1109486249085493e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0140480242478862e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1046, - "real_time": 6.6940435724792362e+05, - "cpu_time": 4.8463720939194781e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5062902292681545e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1046, - "real_time": 6.6950762008688983e+05, - "cpu_time": 4.8457237224092776e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5059036666113857e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1046, - "real_time": 6.6957844873795903e+05, - "cpu_time": 4.8427772593787277e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5056385897159901e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1046, - "real_time": 6.6938326103313616e+05, - "cpu_time": 4.8443575993308067e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5063692172561638e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1046, - "real_time": 6.6936109632380086e+05, - "cpu_time": 4.8443861004396760e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5064522112417610e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6944695668594190e+05, - "cpu_time": 4.8447233550955933e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5061307828186909e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time_median", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6940435724792362e+05, - "cpu_time": 4.8443861004396760e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5062902292681545e+10, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2485212672424751e+01, - "cpu_time": 1.3922895731211343e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4620305074565709e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3815166645953162e-04, - "cpu_time": 2.8738267824038891e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3814245175037363e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 71, - "real_time": 9.7161723484455701e+06, - "cpu_time": 6.9548810798592114e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4534620009460993e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 71, - "real_time": 9.7455674598754290e+06, - "cpu_time": 6.9662771101407552e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4430454807429862e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 71, - "real_time": 9.7286073805790544e+06, - "cpu_time": 6.9636898254930520e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4490478120212526e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 71, - "real_time": 9.7122040354240108e+06, - "cpu_time": 6.9552773847888350e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4548730522561655e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 71, - "real_time": 9.7204361793021075e+06, - "cpu_time": 6.9609572388734674e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4519471535081964e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7245974807252362e+06, - "cpu_time": 6.9602165278310657e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4504750998949404e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time_median", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7204361793021075e+06, - "cpu_time": 6.9609572388734674e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4519471535081964e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3207158024059720e+04, - "cpu_time": 5.0548305233427428e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6815300946250465e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3581187345015704e-03, - "cpu_time": 7.2624615960301510e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3567784027096990e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 37, - "real_time": 1.8948359062542785e+07, - "cpu_time": 7.3275471194594157e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5416715388648691e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 37, - "real_time": 1.8915684239284411e+07, - "cpu_time": 7.3228552645943451e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5477893979974132e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 37, - "real_time": 1.8956462827485960e+07, - "cpu_time": 7.3263082975673056e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5401574972465520e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 37, - "real_time": 1.8896350486053001e+07, - "cpu_time": 7.3199655083784986e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5514193097514591e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 37, - "real_time": 1.8940705000548750e+07, - "cpu_time": 7.3263980129729736e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5431027513524828e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8931512323182981e+07, - "cpu_time": 7.3246148405945086e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5448280990425553e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time_median", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8940705000548750e+07, - "cpu_time": 7.3263082975673056e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5431027513524828e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4888394078850757e+04, - "cpu_time": 3.1368040001064300e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6628469858488813e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3146542998772024e-03, - "cpu_time": 4.2825514629405803e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3153943874198860e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19, - "real_time": 3.7407093730412029e+07, - "cpu_time": 7.8870921968418896e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5880287564516339e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19, - "real_time": 3.7324373071130954e+07, - "cpu_time": 7.8750799521055257e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5959807749272695e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19, - "real_time": 3.7196305237318337e+07, - "cpu_time": 7.8668126668422866e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6083618290491371e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19, - "real_time": 3.7204052664731681e+07, - "cpu_time": 7.8668728021051502e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.6076104184003148e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19, - "real_time": 3.7285753378742620e+07, - "cpu_time": 7.8784588800001347e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5997054058862147e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7283515616467126e+07, - "cpu_time": 7.8748632995789969e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5999374369429140e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time_median", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7285753378742620e+07, - "cpu_time": 7.8750799521055245e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5997054058862147e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7843469246882625e+04, - "cpu_time": 8.5320250015886535e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4760059960337449e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3560940483864814e-03, - "cpu_time": 1.0834505536172026e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3544870277611308e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 7.3058352619409561e+07, - "cpu_time": 9.0799446999998856e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6742610033706703e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 7.3467407375574112e+07, - "cpu_time": 9.0970657960000956e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6538033066516976e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 7.3472016304731369e+07, - "cpu_time": 9.1046235060003376e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6535741020995173e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 7.3133391886949539e+07, - "cpu_time": 9.0747465910000074e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6704909901478481e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 7.3598980903625488e+07, - "cpu_time": 9.1075316110000134e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6472713712096639e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3346029818058029e+07, - "cpu_time": 9.0927824408000684e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6598801546958795e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time_median", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3467407375574112e+07, - "cpu_time": 9.0970657960000956e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6538033066516976e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3588260763534499e+05, - "cpu_time": 1.4715599250921644e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1780008914468613e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2160242104511284e-03, - "cpu_time": 1.6183824199830770e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2186870653002245e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4363502860069275e+08, - "cpu_time": 1.0895625713999722e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7377436216656322e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4328728318214417e+08, - "cpu_time": 1.0878594270000122e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7468147910763268e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4357064068317413e+08, - "cpu_time": 1.0894475270000043e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7394199081742969e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4301749169826508e+08, - "cpu_time": 1.0866443969999864e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7538828686261506e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4365528225898743e+08, - "cpu_time": 1.0899903119999747e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7372166449967909e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4343314528465271e+08, - "cpu_time": 1.0887008468799901e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7430155669078393e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time_median", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4357064068317413e+08, - "cpu_time": 1.0894475270000043e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7394199081742969e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7525004546019703e+05, - "cpu_time": 1.4053286242467305e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1916968550127307e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9190128258983990e-03, - "cpu_time": 1.2908308359216728e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9213643989607818e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8568084537982941e+08, - "cpu_time": 1.3095175205000374e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7585362874868193e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8608894348144531e+08, - "cpu_time": 1.3160597450000181e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7531748376345029e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8573444485664368e+08, - "cpu_time": 1.3160235745000365e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7578312427075739e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8603863716125488e+08, - "cpu_time": 1.3156852230000310e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7538349177446117e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8553828597068787e+08, - "cpu_time": 1.3141140364999728e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7604127949070401e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8581623136997223e+08, - "cpu_time": 1.3142800199000192e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7567580160961099e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time_median", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8573444485664368e+08, - "cpu_time": 1.3156852230000310e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7578312427075739e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3775422012796212e+05, - "cpu_time": 2.7789814163428601e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1247057669355045e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.3184296073165738e-04, - "cpu_time": 2.1144515432519962e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.3175593252146390e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 102255, - "real_time": 6.8484361358507349e+03, - "cpu_time": 7.2839379970801342e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7380796859573677e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 102255, - "real_time": 6.8462456280277884e+03, - "cpu_time": 7.2935433273026943e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7392757126908168e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 102255, - "real_time": 6.8538754311041830e+03, - "cpu_time": 7.2699816315656304e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7351131133522436e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 102255, - "real_time": 6.8490449688680901e+03, - "cpu_time": 7.2824897000005317e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7377473963688679e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 102255, - "real_time": 6.8456261915812220e+03, - "cpu_time": 7.2668517947522902e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7396140664944544e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8486456710864049e+03, - "cpu_time": 7.2793608901402557e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7379659949727498e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time_median", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8484361358507349e+03, - "cpu_time": 7.2824897000005317e+08, - "time_unit": "ns", - "bytes": 2.5600000000000000e+02, - "bytes_per_second": 3.7380796859573677e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2569616486729140e+00, - "cpu_time": 1.0912479574331972e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7770160935891941e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):8/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.7556287842764975e-04, - "cpu_time": 1.4990985800845101e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7539653811167127e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 102123, - "real_time": 6.8495124400909181e+03, - "cpu_time": 7.2719138972379589e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4749845989505768e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 102123, - "real_time": 6.8517936474987573e+03, - "cpu_time": 7.2654737067598474e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4724959089640021e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 102123, - "real_time": 6.8603435568860477e+03, - "cpu_time": 7.2582593411996472e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4631830863059580e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 102123, - "real_time": 6.8571205472621796e+03, - "cpu_time": 7.2476836612865746e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4666909597268865e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 102123, - "real_time": 6.8548179513394971e+03, - "cpu_time": 7.2285607977197921e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4691990893784478e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8547176286154809e+03, - "cpu_time": 7.2543782808407640e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4693107286651745e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time_median", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8548179513394962e+03, - "cpu_time": 7.2582593411996472e+08, - "time_unit": "ns", - "bytes": 5.1200000000000000e+02, - "bytes_per_second": 7.4691990893784478e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2743070977894551e+00, - "cpu_time": 1.7007566800650614e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6573015537433261e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):9/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.2355699087385773e-04, - "cpu_time": 2.3444554643047210e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2352494399113361e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 101595, - "real_time": 6.8738231721046468e+03, - "cpu_time": 7.2027767068654752e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4897095464363956e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 101595, - "real_time": 6.8887374931707363e+03, - "cpu_time": 7.2259923794683099e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4864842810676983e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 101595, - "real_time": 6.8689065384965234e+03, - "cpu_time": 7.1906261180905735e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4907758524024621e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 101595, - "real_time": 6.8880739868229139e+03, - "cpu_time": 7.2109028359041107e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4866274693897626e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 101595, - "real_time": 6.8707409000927728e+03, - "cpu_time": 7.1853838279591227e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4903778426372814e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8780564181375184e+03, - "cpu_time": 7.2031363736575174e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4887949983867201e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time_median", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8738231721046468e+03, - "cpu_time": 7.2027767068654752e+08, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.4897095464363956e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6124206093596936e+00, - "cpu_time": 1.6236561141599903e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0798541516173678e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3975489622346834e-03, - "cpu_time": 2.2540960353018423e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3970050637402247e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 100653, - "real_time": 6.9667087701692708e+03, - "cpu_time": 7.1769785341178453e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9396951524216497e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 100653, - "real_time": 6.9565753642958871e+03, - "cpu_time": 7.1984533576336956e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9439773060049194e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 100653, - "real_time": 6.9719639458366664e+03, - "cpu_time": 7.1830603203338289e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9374793328111953e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 100653, - "real_time": 6.9561093812928893e+03, - "cpu_time": 7.1940705447561657e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9441745201817840e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 100653, - "real_time": 6.9655326508378321e+03, - "cpu_time": 7.1770669228735065e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9401915153662533e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9633780224865095e+03, - "cpu_time": 7.1859259359430087e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9411035653571606e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time_median", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9655326508378321e+03, - "cpu_time": 7.1830603203338289e+08, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.9401915153662533e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8659246736578154e+00, - "cpu_time": 9.8744722865029122e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8999858868622105e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.8600487457179667e-04, - "cpu_time": 1.3741405595501849e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.8601964276971775e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 98360, - "real_time": 7.1272402137021882e+03, - "cpu_time": 7.1045910245265937e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.7469649923197484e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 98360, - "real_time": 7.1407990328581236e+03, - "cpu_time": 7.1236857970747590e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.7360527598555946e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 98360, - "real_time": 7.1374168338831387e+03, - "cpu_time": 7.1160328804107273e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.7387708961528528e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 98360, - "real_time": 7.1272451260138196e+03, - "cpu_time": 7.1187030544560134e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.7469610313386858e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 98360, - "real_time": 7.1313202549518901e+03, - "cpu_time": 7.1059993780930352e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.7436769820508265e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1328042922818322e+03, - "cpu_time": 7.1138024269122255e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.7424853323435426e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time_median", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1313202549518883e+03, - "cpu_time": 7.1160328804107273e+08, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.7436769820508265e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.1085408180325382e+00, - "cpu_time": 8.2524175817115302e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9166627144842874e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.5640101252215553e-04, - "cpu_time": 1.1600571798974640e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5619073100492678e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 94549, - "real_time": 7.4070241870890504e+03, - "cpu_time": 6.9712258698073673e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.1059772174470844e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 94549, - "real_time": 7.4057946887364305e+03, - "cpu_time": 6.9771897198414624e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.1061608300402007e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 94549, - "real_time": 7.4064775102638532e+03, - "cpu_time": 6.9770830473361874e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.1060588503303459e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 94549, - "real_time": 7.4058446985120900e+03, - "cpu_time": 6.9842584715178740e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.1061533604189482e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 94549, - "real_time": 7.4082446421598852e+03, - "cpu_time": 6.9735957904288101e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.1057950156478109e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4066771453522624e+03, - "cpu_time": 6.9766705797863412e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.1060290547768781e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time_median", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4064775102638541e+03, - "cpu_time": 6.9770830473361874e+08, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.1060588503303459e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0110682153656385e+00, - "cpu_time": 4.9273454593015619e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5096838238518688e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3650766673421028e-04, - "cpu_time": 7.0626030037560699e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3649585581243352e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 89931, - "real_time": 7.7889845918109459e+03, - "cpu_time": 6.8231781505169857e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1034834267390308e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 89931, - "real_time": 7.7859605615158689e+03, - "cpu_time": 6.8379164299266994e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1043004097634623e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 89931, - "real_time": 7.7883657211345599e+03, - "cpu_time": 6.8250424296609080e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1036505714594617e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 89931, - "real_time": 7.7866978973535897e+03, - "cpu_time": 6.8305448498866165e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1041011499326708e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 89931, - "real_time": 7.7905507523821607e+03, - "cpu_time": 6.8380009738194025e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1030605564042017e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7881119048394248e+03, - "cpu_time": 6.8309365667621219e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1037192228597653e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time_median", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7883657211345590e+03, - "cpu_time": 6.8305448498866153e+08, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1036505714594617e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8304151093580383e+00, - "cpu_time": 6.9590167008380615e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9441906241567992e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3502681159738394e-04, - "cpu_time": 1.0187500107524275e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3502141209869910e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 81362, - "real_time": 8.6076701777321214e+03, - "cpu_time": 6.5660209113656676e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8068373117699366e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 81362, - "real_time": 8.6037865211125900e+03, - "cpu_time": 6.5728230986929035e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8085556771534867e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 81362, - "real_time": 8.6073227580219864e+03, - "cpu_time": 6.5567211592792988e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8069909681800151e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 81362, - "real_time": 8.6024279442364968e+03, - "cpu_time": 6.5731332374391627e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8091571603286824e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 81362, - "real_time": 8.6057074537810240e+03, - "cpu_time": 6.5637967558046961e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8077055461143961e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6053829709768434e+03, - "cpu_time": 6.5664990325163448e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8078493327093034e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time_median", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6057074537810222e+03, - "cpu_time": 6.5660209113656676e+08, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8077055461143961e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2572224518600130e+00, - "cpu_time": 6.8400327543009014e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9887263812760438e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6230354412730840e-04, - "cpu_time": 1.0416559448847942e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6231937003056306e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 67958, - "real_time": 1.0302569364955414e+04, - "cpu_time": 6.1650037270971119e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.3611316438133593e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 67958, - "real_time": 1.0295583253538312e+04, - "cpu_time": 6.1759700243177187e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.3654480165052385e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 67958, - "real_time": 1.0308985166918201e+04, - "cpu_time": 6.1706597862686074e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.3571727904223509e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 67958, - "real_time": 1.0297161501054032e+04, - "cpu_time": 6.1724547014867508e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.3644723833156977e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 67958, - "real_time": 1.0323667581841943e+04, - "cpu_time": 6.1592305842869616e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.3481315608485622e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0305593373661581e+04, - "cpu_time": 6.1686637646914315e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.3592712789810410e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time_median", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0302569364955416e+04, - "cpu_time": 6.1706597862686074e+08, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 6.3611316438133593e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1386668433271826e+01, - "cpu_time": 6.5976795406276174e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0207105131945154e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1049017771624088e-03, - "cpu_time": 1.0695476025767221e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1040117971377781e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 53497, - "real_time": 1.3090852139985167e+04, - "cpu_time": 5.7782888470064843e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0012488002950474e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 53497, - "real_time": 1.3085423678109963e+04, - "cpu_time": 5.7836625980563581e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0016641663598915e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 53497, - "real_time": 1.3088462134745285e+04, - "cpu_time": 5.7869685774940419e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0014316323080442e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 53497, - "real_time": 1.3085665950246046e+04, - "cpu_time": 5.7829706937530529e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0016456212343971e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 53497, - "real_time": 1.3089028020318825e+04, - "cpu_time": 5.7821752833771384e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0013883368308910e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3087886384681060e+04, - "cpu_time": 5.7828131999374175e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0014757114056543e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time_median", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3088462134745285e+04, - "cpu_time": 5.7829706937530541e+08, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0014316323080442e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3143993415054251e+00, - "cpu_time": 3.1180984202165238e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7709499950026821e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7683522560329936e-04, - "cpu_time": 5.3920095849720152e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7683404348538885e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 39138, - "real_time": 1.7888081201012868e+04, - "cpu_time": 5.4520939953593600e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4654674084616560e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 39138, - "real_time": 1.7884748147024398e+04, - "cpu_time": 5.4417889453689992e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4657405172552828e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 39138, - "real_time": 1.7890784688816591e+04, - "cpu_time": 5.4498379685855150e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4652459607535517e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 39138, - "real_time": 1.7890662272893282e+04, - "cpu_time": 5.4460724041128600e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4652559866226015e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 39138, - "real_time": 1.7890714834102113e+04, - "cpu_time": 5.4512951031260931e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4652516818406733e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7888998228769855e+04, - "cpu_time": 5.4482176833105636e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4653923109867531e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time_median", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7890662272893282e+04, - "cpu_time": 5.4498379685855138e+08, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4652559866226015e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6368234094501313e+00, - "cpu_time": 4.2735385390184785e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1602460209522434e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4739916543842456e-04, - "cpu_time": 7.8439203193175246e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4741758945750137e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 24145, - "real_time": 2.9013589618722359e+04, - "cpu_time": 5.1883634234059668e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.8070428612586391e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 24145, - "real_time": 2.9001993029025420e+04, - "cpu_time": 5.2171856186370760e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.8077654162432510e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 24145, - "real_time": 2.9012961658830627e+04, - "cpu_time": 5.2240580276229346e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.8070819731029537e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 24145, - "real_time": 2.9002345490259024e+04, - "cpu_time": 5.1905080833747369e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.8077434467363750e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 24145, - "real_time": 2.9016439746548080e+04, - "cpu_time": 5.2022745702263093e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.8068653652189415e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9009465908677103e+04, - "cpu_time": 5.2044779446534050e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.8072998125120327e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time_median", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9012961658830627e+04, - "cpu_time": 5.2022745702263099e+08, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.8070819731029537e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7897709292952513e+00, - "cpu_time": 1.5847352343602278e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2303089660401875e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3405363444710452e-04, - "cpu_time": 3.0449456241585897e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3406791373260449e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 13500, - "real_time": 5.1772802291250424e+04, - "cpu_time": 5.1396943129285902e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0253414024243549e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 13500, - "real_time": 5.1756764818424861e+04, - "cpu_time": 5.1421504139484298e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0259689794728401e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 13500, - "real_time": 5.1743254803080126e+04, - "cpu_time": 5.1425103681124133e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0264979541595848e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 13500, - "real_time": 5.1800261916435338e+04, - "cpu_time": 5.1351280668730170e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0242677569692070e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 13500, - "real_time": 5.1762609208472655e+04, - "cpu_time": 5.1449032633060032e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0257402322531414e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1767138607532695e+04, - "cpu_time": 5.1408772850336903e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0255632650558258e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time_median", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1762609208472655e+04, - "cpu_time": 5.1421504139484292e+08, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.0257402322531414e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1376377005141439e+01, - "cpu_time": 3.7063881029560952e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.3623105730988011e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1293333145577687e-04, - "cpu_time": 7.2096412683225633e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1283877513785435e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7664, - "real_time": 9.1309063604502197e+04, - "cpu_time": 5.0218371630450851e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2967621364332943e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7664, - "real_time": 9.1330230529127221e+04, - "cpu_time": 5.0230105824518043e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2962298330465424e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7664, - "real_time": 9.1287914332428816e+04, - "cpu_time": 5.0218733449096096e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2972942424373199e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7664, - "real_time": 9.1320860050784526e+04, - "cpu_time": 5.0266113440414649e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2964654503185265e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7664, - "real_time": 9.1317477290621144e+04, - "cpu_time": 5.0243313943044686e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2965505204723721e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1313109161492786e+04, - "cpu_time": 5.0235327657504863e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2966604365416115e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time_median", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1317477290621144e+04, - "cpu_time": 5.0230105824518043e+08, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2965505204723721e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5995655629792612e+01, - "cpu_time": 2.0010543060781184e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0235969935767674e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7517370481278126e-04, - "cpu_time": 3.9833607132433479e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7519337772176871e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4014, - "real_time": 1.7426044831686298e+05, - "cpu_time": 4.8792193099879640e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4069167963882267e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4014, - "real_time": 1.7442562973133035e+05, - "cpu_time": 4.8911955892895830e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4046374414474129e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4014, - "real_time": 1.7429557301855925e+05, - "cpu_time": 4.8785436617013967e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4064317454312992e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4014, - "real_time": 1.7448422920999318e+05, - "cpu_time": 4.8803888606323403e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4038298584292805e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4014, - "real_time": 1.7424793403954618e+05, - "cpu_time": 4.8864577830687499e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4070896582613644e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7434276286325842e+05, - "cpu_time": 4.8831610409360063e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4057810999915169e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time_median", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7429557301855925e+05, - "cpu_time": 4.8803888606323397e+08, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.4064317454312992e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0591826665039991e+02, - "cpu_time": 5.4764243218697188e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4612297080845298e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.0752889830864045e-04, - "cpu_time": 1.1214916477176010e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0738265342997425e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2063, - "real_time": 3.3931270205283514e+05, - "cpu_time": 4.8426109110029310e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4722351828413990e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2063, - "real_time": 3.3933899305380299e+05, - "cpu_time": 4.8456488892093170e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4720436412298683e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2063, - "real_time": 3.3920815516867273e+05, - "cpu_time": 4.8442316224525923e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4729971470847237e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2063, - "real_time": 3.3930277997439151e+05, - "cpu_time": 4.8436370201840097e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4723074773018719e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2063, - "real_time": 3.3932076676234504e+05, - "cpu_time": 4.8577185519578326e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4721764246970627e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3929667940240947e+05, - "cpu_time": 4.8467693989613360e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4723519746309853e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time_median", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3931270205283514e+05, - "cpu_time": 4.8442316224525917e+08, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 2.4722351828413990e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1237506455225706e+01, - "cpu_time": 6.2186136309157859e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7341501448549172e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5101092809239515e-04, - "cpu_time": 1.2830430167047840e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5103634851232150e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1045, - "real_time": 6.6971041994062404e+05, - "cpu_time": 4.8201730871488458e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5051448358064152e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1045, - "real_time": 6.7007911445029324e+05, - "cpu_time": 4.8191839092635822e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5037664416332947e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1045, - "real_time": 6.6970367425758590e+05, - "cpu_time": 4.8189723732923561e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5051700692248310e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1045, - "real_time": 6.6996671679389605e+05, - "cpu_time": 4.8238196888989627e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5041864885895859e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1045, - "real_time": 6.7001006072476215e+05, - "cpu_time": 4.8276667727267593e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5040244891027122e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6989399723343237e+05, - "cpu_time": 4.8219631662661016e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5044584648713680e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time_median", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6996671679389593e+05, - "cpu_time": 4.8201730871488458e+08, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.5041864885895859e+10, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7532163984461531e+02, - "cpu_time": 3.7366863092101464e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5549371510884836e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6171549613620800e-04, - "cpu_time": 7.7493049622435377e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6173071915669215e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 71, - "real_time": 9.6978473306541704e+06, - "cpu_time": 6.9404968377459455e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4599876504486666e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 71, - "real_time": 9.7209955368873104e+06, - "cpu_time": 6.9562010388731992e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4517485243845944e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 71, - "real_time": 9.7227759633055869e+06, - "cpu_time": 6.9534157977467251e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4511164431471720e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 71, - "real_time": 9.7168694630684983e+06, - "cpu_time": 6.9477946567603242e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4532142401966381e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 71, - "real_time": 9.7225235224189889e+06, - "cpu_time": 6.9503368321124971e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4512060498107767e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7162023632669114e+06, - "cpu_time": 6.9496490326477396e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4534545815975704e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time_median", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7209955368873104e+06, - "cpu_time": 6.9503368321124983e+08, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4517485243845944e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0529672694526324e+04, - "cpu_time": 6.0164722719658841e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7474047821072116e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0837230741853232e-03, - "cpu_time": 8.6572318166025053e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0851177259072740e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 37, - "real_time": 1.9172685573229920e+07, - "cpu_time": 7.3792731213516283e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5002328569817843e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 37, - "real_time": 1.9132516422384493e+07, - "cpu_time": 7.3624571481077754e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5075816750108500e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 37, - "real_time": 1.9094444761002384e+07, - "cpu_time": 7.3607924394597733e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5145753039679923e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 37, - "real_time": 1.9114661055642206e+07, - "cpu_time": 7.3628402559461391e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5108581734537749e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 37, - "real_time": 1.9156672463223740e+07, - "cpu_time": 7.3689100143245602e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5031587103048859e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9134196055096548e+07, - "cpu_time": 7.3668545958379757e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5072813439438577e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time_median", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9132516422384497e+07, - "cpu_time": 7.3628402559461391e+08, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.5075816750108500e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1429423635843610e+04, - "cpu_time": 7.5935290276164142e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7611421936418125e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6425787394120550e-03, - "cpu_time": 1.0307694999038670e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6426233394676972e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19, - "real_time": 3.7568856030702591e+07, - "cpu_time": 7.9090183836836720e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5725795826817975e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19, - "real_time": 3.7438060892255686e+07, - "cpu_time": 7.8904867878950906e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5850608926105957e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19, - "real_time": 3.7396940157601707e+07, - "cpu_time": 7.8837894468419063e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5890029353836708e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19, - "real_time": 3.7417479447628319e+07, - "cpu_time": 7.8890834536842275e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5870328515275574e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19, - "real_time": 3.7475568291388057e+07, - "cpu_time": 7.8906135178947592e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5814727866540031e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7459380963915274e+07, - "cpu_time": 7.8925983179999304e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5830298097715249e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time_median", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7438060892255679e+07, - "cpu_time": 7.8904867878950906e+08, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5850608926105957e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7742078198577772e+04, - "cpu_time": 9.5912333681367652e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4703059741931837e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8084142464562857e-03, - "cpu_time": 1.2152187380755095e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8058197441024831e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.3962683478991196e+07, - "cpu_time": 8.4144696300004148e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6293363541392875e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.3741830057568014e+07, - "cpu_time": 8.4004143733339894e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6402060511712356e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.3939198421107396e+07, - "cpu_time": 8.4093002577781641e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6304891279882989e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.3666060964266464e+07, - "cpu_time": 8.3976704033338785e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6439501784982266e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.3897884951697454e+07, - "cpu_time": 8.4129973944445479e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6325187950299239e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3841531574726120e+07, - "cpu_time": 8.4069704117781997e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6353001013653946e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time_median", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3897884951697454e+07, - "cpu_time": 8.4093002577781653e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6325187950299239e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3050155893606119e+05, - "cpu_time": 7.5409345162084536e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4292221273059156e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7673192328628276e-03, - "cpu_time": 8.9698597078961687e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7685533375610841e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4463456571102142e+08, - "cpu_time": 1.0934778209999876e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7119129121088753e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4455555677413940e+08, - "cpu_time": 1.0940667435999331e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7139417119663763e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4454233348369598e+08, - "cpu_time": 1.0936528876000695e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7142814776859660e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4478163421154022e+08, - "cpu_time": 1.0935118559999409e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7081423684966750e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4435479044914246e+08, - "cpu_time": 1.0929844851999631e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7191070024734969e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4457377612590793e+08, - "cpu_time": 1.0935387586799788e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7134770945462780e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time_median", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4455555677413940e+08, - "cpu_time": 1.0935118559999409e+09, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7139417119663763e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5506101102667564e+05, - "cpu_time": 3.8841013473956374e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9832378027529311e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 21, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0725389844672417e-03, - "cpu_time": 3.5518643638056077e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0726436978978088e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8841078281402588e+08, - "cpu_time": 1.3213358980000293e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7229600555273767e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8932066261768341e+08, - "cpu_time": 1.3251043865000155e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7112517795484009e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8876855969429016e+08, - "cpu_time": 1.3234571104999874e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7183474029746709e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8886136412620544e+08, - "cpu_time": 1.3236674989999528e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7171527845131793e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8888833522796631e+08, - "cpu_time": 1.3238982144999909e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7168057448657231e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8884994089603430e+08, - "cpu_time": 1.3234926216999955e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7173035534858704e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time_median", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8886136412620544e+08, - "cpu_time": 1.3236674989999528e+09, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7171527845131793e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2506394564572454e+05, - "cpu_time": 1.3643305612190075e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1827069463494569e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 22, - "run_name": "Comm_hipMemcpyAsync_PageableToGPU/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1253730730820014e-03, - "cpu_time": 1.0308561897886192e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1251991897264237e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - } - ] -} - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5428487739714671e-03, - "cpu_time": 2.6074273681687640e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5437248099391895e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - } - ] -} diff --git a/results/implicit_managed_GPURdHost_coarse.json b/results/implicit_managed_GPURdHost_coarse.json deleted file mode 100644 index 184d3b1..0000000 --- a/results/implicit_managed_GPURdHost_coarse.json +++ /dev/null @@ -1,25272 +0,0 @@ -{ - "context": { - "date": "2023-10-09T14:45:25-04:00", - "host_name": "frontier10485", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1797, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [2.47,2.62,2.57], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8751100435986668e+06, - "cpu_time": 2.0745011851851849e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1844051307725143e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8677153235311231e+06, - "cpu_time": 2.0668210343915343e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1930536995627671e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8622939680724849e+06, - "cpu_time": 2.0667339391534391e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1994379352683239e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8681128048031561e+06, - "cpu_time": 2.0670184417989426e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1925870801102924e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8641001199535034e+06, - "cpu_time": 2.0669938703703708e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1973068700312981e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8674664519917867e+06, - "cpu_time": 2.0684136941798944e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1933581431490392e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8677153235311233e+06, - "cpu_time": 2.0669938703703706e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1930536995627671e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9242000096242473e+03, - "cpu_time": 3.4050814141484502e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7749452578109249e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6368345221796275e-03, - "cpu_time": 1.6462284231291227e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6329239827289417e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8670017068668837e+06, - "cpu_time": 2.0676265396825387e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3877838835763233e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8626884780205151e+06, - "cpu_time": 2.0678958280423309e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3979442062720358e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8630216313193727e+06, - "cpu_time": 2.0677932301587311e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3971577475450514e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8677094592247775e+06, - "cpu_time": 2.0675929312169293e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3861211707950663e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8616802594493572e+06, - "cpu_time": 2.0676909179894219e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4003259734961195e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8644203069761812e+06, - "cpu_time": 2.0677198894179899e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3938665963369198e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8630216313193727e+06, - "cpu_time": 2.0676909179894216e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3971577475450514e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7361256131991186e+03, - "cpu_time": 1.2450418470591167e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4454081269421231e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4675476355633119e-03, - "cpu_time": 6.0213274217213431e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4669102908849198e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8677965247321476e+06, - "cpu_time": 2.0699868779840847e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7718334320969768e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8637731846149294e+06, - "cpu_time": 2.0700418063660499e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7907692498457469e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8630563602236221e+06, - "cpu_time": 2.0697690954907143e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7941515618096665e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8656884978158802e+06, - "cpu_time": 2.0681071405835564e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7817446584359519e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8613719109769117e+06, - "cpu_time": 2.0683259602122013e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8021098327421919e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8643372956726984e+06, - "cpu_time": 2.0692461761273213e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7881217469861079e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8637731846149296e+06, - "cpu_time": 2.0697690954907145e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7907692498457469e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4771221315615626e+03, - "cpu_time": 9.4859246722362695e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1672734701438059e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3286877526460447e-03, - "cpu_time": 4.5842417309619311e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3282399854600594e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8690201203625670e+06, - "cpu_time": 2.0724493740053037e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7532181512119520e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8658787134073833e+06, - "cpu_time": 2.0744431671087488e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7561698820262846e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8698409099665419e+06, - "cpu_time": 2.0736714535809003e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7524485545984946e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8740250987909546e+06, - "cpu_time": 2.0773150583554374e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7485358131617658e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8636378169095884e+06, - "cpu_time": 2.0717073474801136e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7582815557122648e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8684805318874072e+06, - "cpu_time": 2.0739172801061007e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7537307913421523e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8690201203625672e+06, - "cpu_time": 2.0736714535809003e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7532181512119520e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9719439241561035e+03, - "cpu_time": 2.1748813405113347e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7267059511173873e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1257614710836329e-03, - "cpu_time": 1.0486827808291700e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1250159770903562e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8697246206519490e+06, - "cpu_time": 2.0776388700265258e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5051150996315405e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8651058856615259e+06, - "cpu_time": 2.0778952466843508e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5137951418106936e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8692548281260871e+06, - "cpu_time": 2.0774052811671009e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5059960265395872e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8754388123953873e+06, - "cpu_time": 2.0834742015915096e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4944355191356383e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8711968954091778e+06, - "cpu_time": 2.0790209363395199e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5023572431520700e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8701442084488254e+06, - "cpu_time": 2.0790869071618016e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5043398060539059e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8697246206519487e+06, - "cpu_time": 2.0778952466843512e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5051150996315405e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7246720854352302e+03, - "cpu_time": 2.5296954750703999e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9780544517257818e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9916496645596255e-03, - "cpu_time": 1.2167338779136136e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9912607903123081e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 371, - "real_time": 1.8738107309416889e+06, - "cpu_time": 2.0901815498652300e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9949433971983597e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 371, - "real_time": 1.8778901036189885e+06, - "cpu_time": 2.0945401051212894e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9797481624405876e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 371, - "real_time": 1.8702027491623953e+06, - "cpu_time": 2.0904080970350360e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0084379920146629e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 371, - "real_time": 1.8784433911661832e+06, - "cpu_time": 2.0955046684636089e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9776923071728736e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 371, - "real_time": 1.8744248239216181e+06, - "cpu_time": 2.0909626118598357e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9926517365350991e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8749543597621745e+06, - "cpu_time": 2.0923194064690000e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9906947190723166e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8744248239216183e+06, - "cpu_time": 2.0909626118598361e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9926517365350991e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3525374907899154e+03, - "cpu_time": 2.5070811064369054e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2505945937333169e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7880635191648941e-03, - "cpu_time": 1.1982305850079828e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7889417918957188e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8769197323265309e+06, - "cpu_time": 2.1097606058201012e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3966713412675357e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8803698822493153e+06, - "cpu_time": 2.1136976481481460e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3941086935854396e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8730606651549579e+06, - "cpu_time": 2.1091816322751283e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3995489034430867e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8724376018831714e+06, - "cpu_time": 2.1080763333333354e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4000146105608714e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8720892366165388e+06, - "cpu_time": 2.1082727089947090e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4002751304407778e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8749754236461029e+06, - "cpu_time": 2.1097977857142841e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3981237358595422e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8730606651549574e+06, - "cpu_time": 2.1091816322751283e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3995489034430867e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5818094174025018e+03, - "cpu_time": 2.2846888032722254e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6676311090553732e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9103233952993720e-03, - "cpu_time": 1.0828946824867063e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9080078827324678e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 375, - "real_time": 1.8904089203570038e+06, - "cpu_time": 2.1565853653333322e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7734105269720596e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 375, - "real_time": 1.8960174412156143e+06, - "cpu_time": 2.1599097360000126e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7652066305036598e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 375, - "real_time": 1.8959440943629793e+06, - "cpu_time": 2.1591997360000052e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7653136058115482e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 375, - "real_time": 1.8935455000028012e+06, - "cpu_time": 2.1590812213333379e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7688164873736823e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 375, - "real_time": 1.8908149468867728e+06, - "cpu_time": 2.1567121093333415e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7728149751684600e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8933461805650345e+06, - "cpu_time": 2.1582976336000063e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7691124451658815e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8935455000028019e+06, - "cpu_time": 2.1590812213333379e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7688164873736823e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6906857520969861e+03, - "cpu_time": 1.5388650392063330e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9356192422540067e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4211271978239078e-03, - "cpu_time": 7.1299945626105809e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4212565651223479e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 368, - "real_time": 1.9123107617222401e+06, - "cpu_time": 2.2356552608695612e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4832928883151054e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 368, - "real_time": 1.9077574329655718e+06, - "cpu_time": 2.2330040597826228e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4963801051479018e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 368, - "real_time": 1.9116922988399416e+06, - "cpu_time": 2.2362545353260930e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4850668208283293e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 368, - "real_time": 1.9055854068226283e+06, - "cpu_time": 2.2323042173913191e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5026449942665911e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 368, - "real_time": 1.9121385684348238e+06, - "cpu_time": 2.2358612445652266e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4837866737780893e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9098968937570411e+06, - "cpu_time": 2.2346158635869646e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4902342964672029e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9116922988399416e+06, - "cpu_time": 2.2356552608695612e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4850668208283293e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0512929795080904e+03, - "cpu_time": 1.8205895470775454e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7785843706146604e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5976218347084484e-03, - "cpu_time": 8.1472148155037620e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5989453084476577e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 360, - "real_time": 1.9559310999789482e+06, - "cpu_time": 2.4151188305555452e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0722013674318956e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 360, - "real_time": 1.9592205077060498e+06, - "cpu_time": 2.4175917472222252e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0704012089254042e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 360, - "real_time": 1.9648862417347524e+06, - "cpu_time": 2.4233646638889024e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0673147154557271e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 360, - "real_time": 1.9555652687106179e+06, - "cpu_time": 2.4142784222222203e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0724019461558223e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 360, - "real_time": 1.9528207561557388e+06, - "cpu_time": 2.4102811694444367e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0739091098808203e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9576847748572216e+06, - "cpu_time": 2.4161269666666659e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0712456695699339e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9559310999789480e+06, - "cpu_time": 2.4151188305555452e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0722013674318956e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6218492073225443e+03, - "cpu_time": 4.8253663928453334e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5253594924762691e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3608750840183792e-03, - "cpu_time": 1.9971493466266386e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3574046217522716e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 337, - "real_time": 2.0838907763682504e+06, - "cpu_time": 2.7911161364985155e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0127273691904917e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 337, - "real_time": 2.0852552620467430e+06, - "cpu_time": 2.7922532522255252e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0114103421003528e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 337, - "real_time": 2.0834477708152654e+06, - "cpu_time": 2.7917683946587555e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0131553373947763e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 337, - "real_time": 2.0847837630664872e+06, - "cpu_time": 2.7922711513353228e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0118652467969348e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 337, - "real_time": 2.0853316498428406e+06, - "cpu_time": 2.7919416587537094e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0113366621161196e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0845418444279176e+06, - "cpu_time": 2.7918701186943660e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0120989915197353e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0847837630664869e+06, - "cpu_time": 2.7919416587537099e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0118652467969348e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3847608939130009e+02, - "cpu_time": 4.7211581969369007e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0943588969108602e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.0223519217548345e-04, - "cpu_time": 1.6910379051389315e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0228432751199798e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 317, - "real_time": 2.2075359525206005e+06, - "cpu_time": 3.4453625078864209e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.7999870355097728e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 317, - "real_time": 2.2235934693096001e+06, - "cpu_time": 3.4594887003154522e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.7725457084583745e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 317, - "real_time": 2.2076444266281715e+06, - "cpu_time": 3.4465603091482515e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.7998003205671463e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 317, - "real_time": 2.2130364831977696e+06, - "cpu_time": 3.4482001955835917e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.7905421187990174e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 317, - "real_time": 2.2065133214061526e+06, - "cpu_time": 3.4455348801261755e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.8017481782771034e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2116647306124587e+06, - "cpu_time": 3.4490293186119786e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.7929246723222828e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2076444266281715e+06, - "cpu_time": 3.4465603091482511e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.7998003205671463e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1400837098075062e+03, - "cpu_time": 5.9548030943671201e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2206396882212212e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2283752645593166e-03, - "cpu_time": 1.7265156495577605e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2182017669068648e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 211, - "real_time": 3.3299287127869390e+06, - "cpu_time": 5.6254639052132666e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0383108610029478e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 211, - "real_time": 3.3311412749167583e+06, - "cpu_time": 5.6207172180094672e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0364768754574194e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 211, - "real_time": 3.3304075107984776e+06, - "cpu_time": 5.6213563838862600e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0375865252530613e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 211, - "real_time": 3.3343183924995749e+06, - "cpu_time": 5.6216727156398231e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0316778498837185e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 211, - "real_time": 3.3298019591224561e+06, - "cpu_time": 5.6225503838862833e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0385026514974804e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3311195700248410e+06, - "cpu_time": 5.6223521213270202e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0365109526189260e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time_median", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3304075107984771e+06, - "cpu_time": 5.6216727156398222e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0375865252530613e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8637465028597694e+03, - "cpu_time": 1.8606787082715546e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8161780116462810e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.5949552805931570e-04, - "cpu_time": 3.3094311208533607e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5915256377669584e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 105, - "real_time": 6.6690747315684957e+06, - "cpu_time": 1.0998439619047640e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.0313474283273411e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 105, - "real_time": 6.6692529645349300e+06, - "cpu_time": 1.1004949257142827e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.0312129676940317e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 105, - "real_time": 6.6869946329721380e+06, - "cpu_time": 1.1024764057142852e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.0178643533748751e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 105, - "real_time": 6.6845869778522421e+06, - "cpu_time": 1.1025215085714312e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.0196716881947193e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 105, - "real_time": 6.6685915170680908e+06, - "cpu_time": 1.0998481695238145e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.0317120060687904e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6757001647991799e+06, - "cpu_time": 1.1010369942857157e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.0263616887319517e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time_median", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6692529645349290e+06, - "cpu_time": 1.1004949257142829e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.0312129676940317e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2538652312413396e+03, - "cpu_time": 1.3607127578699317e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9638211105340719e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3862014474581661e-03, - "cpu_time": 1.2358465382470440e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3854596111030962e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52, - "real_time": 1.3532606687826606e+07, - "cpu_time": 2.2247601076922927e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9590493205103245e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52, - "real_time": 1.3166999910026789e+07, - "cpu_time": 2.1324687884615220e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.0967467501003017e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52, - "real_time": 1.3541086505238827e+07, - "cpu_time": 2.2288295134615328e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9559438213496876e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52, - "real_time": 1.3550086358848672e+07, - "cpu_time": 2.2289645923076928e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9526521250674982e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52, - "real_time": 1.3625597026055822e+07, - "cpu_time": 2.2349463750000078e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9252053962604151e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3483275297599345e+07, - "cpu_time": 2.2099938753846098e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9779194826576452e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time_median", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3541086505238827e+07, - "cpu_time": 2.2288295134615328e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9559438213496876e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8064124312471267e+05, - "cpu_time": 4.3489876173645270e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7779322919259682e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3397430456446681e-02, - "cpu_time": 1.9678731537695615e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3615994223167548e-02, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 27, - "real_time": 2.6144349878584895e+07, - "cpu_time": 4.2524824851851769e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1337183224410219e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 27, - "real_time": 2.6134234197713710e+07, - "cpu_time": 4.2491634777777396e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1357054117063704e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 27, - "real_time": 2.6145884422240432e+07, - "cpu_time": 4.2541174814815007e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1334170163251610e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 27, - "real_time": 2.6152929912010830e+07, - "cpu_time": 4.2514185592592768e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1320340952835274e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 27, - "real_time": 2.5940217836587518e+07, - "cpu_time": 4.1534037481481634e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1741172277548065e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6103523249427475e+07, - "cpu_time": 4.2321171503703721e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1417984147021780e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time_median", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6144349878584895e+07, - "cpu_time": 4.2514185592592761e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1337183224410219e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1534312043962564e+04, - "cpu_time": 4.4038854389226495e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8114276317450829e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.5065884083662988e-03, - "cpu_time": 1.0405868463582688e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5229456420648184e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.0922773778438568e+07, - "cpu_time": 8.0860656999999493e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2714225106421719e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.1001479104161263e+07, - "cpu_time": 8.0962874799999446e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2632876676335077e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 4.7256883978843689e+07, - "cpu_time": 7.9316505299999565e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.6803460871473284e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.0969207659363747e+07, - "cpu_time": 8.0894641700000137e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2666201482668076e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.0901831313967705e+07, - "cpu_time": 8.0809678300001055e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2735913241365061e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0210435166954994e+07, - "cpu_time": 8.0568871419999942e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3510535475652647e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time_median", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0922773778438568e+07, - "cpu_time": 8.0860656999999493e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2714225106421719e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6515451671188357e+06, - "cpu_time": 7.0230203891479503e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8412422662543026e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2892468699529769e-02, - "cpu_time": 8.7167913182467603e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4408967316203923e-02, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.0074732918292284e+08, - "cpu_time": 1.5863111749999881e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.3288848087002411e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.9162756688892841e+07, - "cpu_time": 1.5542222600000066e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.0212462236138887e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.0075306985527277e+08, - "cpu_time": 1.5874722274999976e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.3285811814090710e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.9142536744475365e+07, - "cpu_time": 1.5601317112500012e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.0226120055224113e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.0080764908343554e+08, - "cpu_time": 1.5874967499999925e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.3256961835867004e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6122668310999870e+07, - "cpu_time": 1.5751268247499973e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6054040805664635e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time_median", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0074732918292284e+08, - "cpu_time": 1.5863111749999881e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.3288848087002411e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3627776551029887e+06, - "cpu_time": 1.6525495200811592e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8023593774932867e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.6194351102661392e-02, - "cpu_time": 1.0491533088730493e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7833813991676276e-02, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.8587203696370125e+08, - "cpu_time": 2.8424355800000000e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7767797756996117e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8610463663935661e+08, - "cpu_time": 2.8453568625000256e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7695597669646111e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.8616894632577896e+08, - "cpu_time": 2.8443631699999726e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7675667461803656e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8597462773323059e+08, - "cpu_time": 2.8430385625000197e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7735930814187088e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8613179028034210e+08, - "cpu_time": 2.8471290374999827e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7687180807898827e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8605040758848190e+08, - "cpu_time": 2.8444646425000000e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7712434902106361e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time_median", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8610463663935661e+08, - "cpu_time": 2.8443631699999726e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7695597669646111e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2366692259828006e+05, - "cpu_time": 1.8745767993772443e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8373851523765502e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.6469578971207848e-04, - "cpu_time": 6.5902622636563300e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6491478983439934e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8620295801602665e+06, - "cpu_time": 2.0660710976253294e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1997502314906586e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8663027288535323e+06, - "cpu_time": 2.0705984089709762e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1947136103241770e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8618873145321007e+06, - "cpu_time": 2.0660708627968419e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1999183130099042e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8575317976215489e+06, - "cpu_time": 2.0665331266490684e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2050766534627653e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8622617377106489e+06, - "cpu_time": 2.0660174617414109e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1994760011744499e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8620026317756199e+06, - "cpu_time": 2.0670581915567252e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1997869618923911e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time_median", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8620295801602665e+06, - "cpu_time": 2.0660710976253296e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1997502314906586e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1048491541061398e+03, - "cpu_time": 1.9900454490588406e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6686179908306731e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6674783918781751e-03, - "cpu_time": 9.6274282803819578e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6677151262296346e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 375, - "real_time": 1.8620746317125547e+06, - "cpu_time": 2.0672955733333158e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3993940202417113e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 375, - "real_time": 1.8668451953756933e+06, - "cpu_time": 2.0725968266666161e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3881517440718487e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 375, - "real_time": 1.8618399599799886e+06, - "cpu_time": 2.0668693573333409e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3999485326805692e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 375, - "real_time": 1.8572925563591223e+06, - "cpu_time": 2.0673934906666698e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4107213868658887e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 375, - "real_time": 1.8610975729534402e+06, - "cpu_time": 2.0671898826666016e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4017036608133512e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8618299832761600e+06, - "cpu_time": 2.0682690261333089e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3999838689346742e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time_median", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8618399599799886e+06, - "cpu_time": 2.0672955733333162e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3999485326805692e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4035633057236446e+03, - "cpu_time": 2.4273263859334302e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0405274129936006e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8280741723444482e-03, - "cpu_time": 1.1736028317705792e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8273992933843133e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 375, - "real_time": 1.8625426740618423e+06, - "cpu_time": 2.0695588853332840e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7965769741370231e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 375, - "real_time": 1.8685057928863293e+06, - "cpu_time": 2.0756780746666361e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7685037222663425e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 375, - "real_time": 1.8634114011268441e+06, - "cpu_time": 2.0695991226666593e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7924759879070446e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 375, - "real_time": 1.8583831679037150e+06, - "cpu_time": 2.0699826426666733e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8162658180343956e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 375, - "real_time": 1.8625811110056627e+06, - "cpu_time": 2.0695126400000085e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7963954445741121e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8630848293968788e+06, - "cpu_time": 2.0708662730666525e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7940435893837828e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time_median", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8625811110056627e+06, - "cpu_time": 2.0695991226666593e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7963954445741121e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6106363588962354e+03, - "cpu_time": 2.6963629492117398e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7033194754792406e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9379881699026428e-03, - "cpu_time": 1.3020459043059391e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9369013334610908e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8613665339390058e+06, - "cpu_time": 2.0760868597883033e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7604270519818939e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8701487881703998e+06, - "cpu_time": 2.0803249179894293e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7521600531077273e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8662884685716890e+06, - "cpu_time": 2.0759683333333293e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7557843040780324e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8608531161917006e+06, - "cpu_time": 2.0758662328042586e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7609127617262360e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8657610421036631e+06, - "cpu_time": 2.0751474497354405e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7562806415474180e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8648835897952914e+06, - "cpu_time": 2.0766787587301522e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7571129624882616e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time_median", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8657610421036626e+06, - "cpu_time": 2.0759683333333291e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7562806415474180e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8431861854685931e+03, - "cpu_time": 2.0709075041223141e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6197743739035381e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0608182765394275e-03, - "cpu_time": 9.9722092086531114e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0600692449377566e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8623322989564359e+06, - "cpu_time": 2.0826821034483330e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5190282656174362e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8670215152990844e+06, - "cpu_time": 2.0824018169761004e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5101898646037601e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8623738841035413e+06, - "cpu_time": 2.0825956021220873e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5189496888561629e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8624617624248189e+06, - "cpu_time": 2.0824231061008151e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5187836508748434e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8673177443528720e+06, - "cpu_time": 2.0820959389920002e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5096330122815713e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8643014410273507e+06, - "cpu_time": 2.0824397135278676e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5153168964467548e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time_median", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8624617624248192e+06, - "cpu_time": 2.0824231061008151e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5187836508748434e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6207967941801830e+03, - "cpu_time": 2.2524820186832721e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9392009171524900e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4057795249763658e-03, - "cpu_time": 1.0816553315088941e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4050513972566690e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8629849828864308e+06, - "cpu_time": 2.0957552015914645e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0355907967074722e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8728298764037886e+06, - "cpu_time": 2.1005798779840758e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9986068489939243e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8643184604147321e+06, - "cpu_time": 2.0958588196286543e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0305585007639751e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8679076523627513e+06, - "cpu_time": 2.0956313633952315e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0170492547746986e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8636322240141376e+06, - "cpu_time": 2.0954882572944032e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0331473297708809e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8663346392163683e+06, - "cpu_time": 2.0966627039787662e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0229905462021917e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time_median", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8643184604147323e+06, - "cpu_time": 2.0957552015914645e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0305585007639751e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1003261726623296e+03, - "cpu_time": 2.1941417020004496e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5403442267882850e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1969940901830783e-03, - "cpu_time": 1.0464924557663476e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1932881963243620e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8760205580545983e+06, - "cpu_time": 2.1232041909814361e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3973407640683794e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8748907921313916e+06, - "cpu_time": 2.1224822546418696e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3981827693654224e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8761529725703313e+06, - "cpu_time": 2.1232494774536090e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3972421430053353e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8751114689922873e+06, - "cpu_time": 2.1226993183024111e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3980182209694448e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8761716441829400e+06, - "cpu_time": 2.1226479230769165e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3972282376869732e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8756694871863101e+06, - "cpu_time": 2.1228566328912484e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3976024270191112e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time_median", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8760205580545985e+06, - "cpu_time": 2.1226993183024111e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3973407640683794e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.1784318671492326e+02, - "cpu_time": 3.4770325429989595e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6042686009832221e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2939875118496981e-04, - "cpu_time": 1.6379026680965147e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2944051269311812e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 371, - "real_time": 1.8945118584801916e+06, - "cpu_time": 2.1805372506738324e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7674041608828586e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 371, - "real_time": 1.8971240610942356e+06, - "cpu_time": 2.1826350404312219e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7635936455183524e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 371, - "real_time": 1.9014419111858732e+06, - "cpu_time": 2.1834050592992064e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7573179959676868e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 371, - "real_time": 1.9017248193236354e+06, - "cpu_time": 2.1841183611859428e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7569078063905561e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 371, - "real_time": 1.8978045426178572e+06, - "cpu_time": 2.1831391671159235e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7626027244975924e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8985214385403588e+06, - "cpu_time": 2.1827669757412253e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7615652666514099e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time_median", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8978045426178575e+06, - "cpu_time": 2.1831391671159235e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7626027244975924e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0550836595281266e+03, - "cpu_time": 1.3565581876916742e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4445069969570305e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6091910249256751e-03, - "cpu_time": 6.2148557439623768e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6094158811413154e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 371, - "real_time": 1.9005310616262679e+06, - "cpu_time": 2.2635313180593201e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5172789394072974e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 371, - "real_time": 1.8960488803252939e+06, - "cpu_time": 2.2624096684636381e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5303215591156173e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 371, - "real_time": 1.9005677159787770e+06, - "cpu_time": 2.2640181886792635e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5171725331553984e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 371, - "real_time": 1.8948171788423681e+06, - "cpu_time": 2.2605709919137750e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5339164733593130e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 371, - "real_time": 1.9005797695145111e+06, - "cpu_time": 2.2644697331536235e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5171375430763996e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8985089212574437e+06, - "cpu_time": 2.2629999800539245e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5231654096228063e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time_median", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9005310616262681e+06, - "cpu_time": 2.2635313180593201e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5172789394072974e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8415164667824547e+03, - "cpu_time": 1.5594625852383419e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2718819208206784e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4967095676855847e-03, - "cpu_time": 6.8911294696572738e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4976705036588050e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 362, - "real_time": 1.9423320459508086e+06, - "cpu_time": 2.4542321602210086e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0797082838497906e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 362, - "real_time": 1.9412248801229040e+06, - "cpu_time": 2.4544938674033331e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0803240889160786e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 362, - "real_time": 1.9442891997596486e+06, - "cpu_time": 2.4570440662983614e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0786214315541372e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 362, - "real_time": 1.9409769301197249e+06, - "cpu_time": 2.4538311878452739e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0804620948640754e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 362, - "real_time": 1.9426281759785539e+06, - "cpu_time": 2.4544928425414581e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0795436954596875e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9422902463863280e+06, - "cpu_time": 2.4548188248618869e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0797319189287539e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time_median", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9423320459508083e+06, - "cpu_time": 2.4544928425414581e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0797082838497906e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3201858853342153e+03, - "cpu_time": 1.2731028586945602e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3365371450024028e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.7970576889342317e-04, - "cpu_time": 5.1861377540405142e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7947765703557986e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 355, - "real_time": 1.9792456597968622e+06, - "cpu_time": 2.8004079492958020e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1191427043121459e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 355, - "real_time": 1.9787115520391033e+06, - "cpu_time": 2.8011053154928912e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1197147182355518e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 355, - "real_time": 1.9802218432616915e+06, - "cpu_time": 2.8021416253520655e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1180980374862535e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 355, - "real_time": 1.9839905858249732e+06, - "cpu_time": 2.8015465633802866e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1140745475140171e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 355, - "real_time": 1.9838702881341458e+06, - "cpu_time": 2.8022253887323928e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1142027405152550e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9812079858113553e+06, - "cpu_time": 2.8014853684506877e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1170465496126451e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time_median", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9802218432616915e+06, - "cpu_time": 2.8015465633802870e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.1180980374862535e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5439191510190753e+03, - "cpu_time": 7.5619445940504795e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7174740901064724e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2840242767229084e-03, - "cpu_time": 2.6992625694962952e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2836156534223053e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 346, - "real_time": 2.0404579037143660e+06, - "cpu_time": 3.5445938554912875e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1111399479154758e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 346, - "real_time": 2.0422382684656002e+06, - "cpu_time": 3.5487322861272171e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1075559740160155e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 346, - "real_time": 2.0406886429197527e+06, - "cpu_time": 3.5443135895954324e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1106751042617874e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 346, - "real_time": 2.0444116678298856e+06, - "cpu_time": 3.5505559393063178e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1031892607541175e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 346, - "real_time": 2.0422724538585010e+06, - "cpu_time": 3.5454258236993910e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1074872180502934e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0420137873576214e+06, - "cpu_time": 3.5467242988439291e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1080095009995384e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time_median", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0422382684656004e+06, - "cpu_time": 3.5454258236993914e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1075559740160155e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5846066213547249e+03, - "cpu_time": 2.7726263371002556e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1866252076075720e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.7600192083189415e-04, - "cpu_time": 7.8174284310850021e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7571028178786343e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 191, - "real_time": 3.6291871305204029e+06, - "cpu_time": 6.5832194293194013e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6228577906354065e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 191, - "real_time": 3.6453806395345023e+06, - "cpu_time": 6.6126901780105513e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6023221328520498e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 191, - "real_time": 3.6544721434624251e+06, - "cpu_time": 6.6320722565445388e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5908725915487337e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 191, - "real_time": 3.6376444817915638e+06, - "cpu_time": 6.5958894345549764e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6121098650457211e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 191, - "real_time": 3.6369575558142513e+06, - "cpu_time": 6.5918416806283779e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6129809717407808e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6407283902246295e+06, - "cpu_time": 6.6031425958115701e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6082286703645382e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time_median", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6376444817915643e+06, - "cpu_time": 6.5958894345549773e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6121098650457211e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5846822538967863e+03, - "cpu_time": 1.9399311786960308e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2122085811384112e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6326276575950286e-03, - "cpu_time": 2.9378907854065517e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6305304442336155e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 98, - "real_time": 7.2721128865164155e+06, - "cpu_time": 1.3348374142857287e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6141241924633675e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 98, - "real_time": 7.2923300607243972e+06, - "cpu_time": 1.3401546673469337e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6013320462166252e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 98, - "real_time": 7.2725259185749656e+06, - "cpu_time": 1.3344556663265238e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6138621402912664e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 98, - "real_time": 7.2736377846829742e+06, - "cpu_time": 1.3375013418367393e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6131568540104980e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 98, - "real_time": 7.2791936275150096e+06, - "cpu_time": 1.3358945295918515e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6096358631216822e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2779600556027535e+06, - "cpu_time": 1.3365687238775555e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6104222192206879e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time_median", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2736377846829761e+06, - "cpu_time": 1.3358945295918517e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6131568540104980e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5208568270402502e+03, - "cpu_time": 2.3262496573827611e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3913238507809937e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1707754318438012e-03, - "cpu_time": 1.7404639326244410e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1693774657567705e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49, - "real_time": 1.4378109699761381e+07, - "cpu_time": 2.5923098142857041e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6674330215406370e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49, - "real_time": 1.4371004392754059e+07, - "cpu_time": 2.5948479244897734e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6697406921562605e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49, - "real_time": 1.4378805150639039e+07, - "cpu_time": 2.5937488020408452e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6672072746613083e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49, - "real_time": 1.4390393768494226e+07, - "cpu_time": 2.6003897142857112e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6634487616958447e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49, - "real_time": 1.4401979079203947e+07, - "cpu_time": 2.5988555061224602e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6596973673502493e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4384058418170532e+07, - "cpu_time": 2.5960303522448990e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6655054234808607e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time_median", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4378805150639037e+07, - "cpu_time": 2.5948479244897738e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6672072746613083e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2193014451121184e+04, - "cpu_time": 3.4435280335482137e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9532520206230213e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.4767553750466349e-04, - "cpu_time": 1.3264590803302612e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4733628230862967e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 25, - "real_time": 2.3682550415396690e+07, - "cpu_time": 4.8034341600000516e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.6673679838443956e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 25, - "real_time": 2.7867418080568314e+07, - "cpu_time": 4.9467176279999875e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8162957763779612e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 25, - "real_time": 2.7814221158623695e+07, - "cpu_time": 4.9436798119999141e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8255073271532640e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 25, - "real_time": 2.7814285308122635e+07, - "cpu_time": 4.9405407199999444e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8254961978406200e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 25, - "real_time": 2.7785082012414932e+07, - "cpu_time": 4.9410874279999465e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8305679983247423e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6992711395025253e+07, - "cpu_time": 4.9150919495999686e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9930470567081966e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time_median", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7814221158623695e+07, - "cpu_time": 4.9410874279999457e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8255073271532640e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8506749227282566e+06, - "cpu_time": 6.2466623490715411e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7699205017214501e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.8562023860609084e-02, - "cpu_time": 1.2709146467910831e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5503404211993821e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 5.4358589897553124e+07, - "cpu_time": 9.4568923266666621e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9382343527657118e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 5.4310600956281029e+07, - "cpu_time": 9.4676272666667193e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9425977852111282e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 5.4265800118446350e+07, - "cpu_time": 9.4654718266665831e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9466783022471609e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.6106208612521492e+07, - "cpu_time": 9.2189426066666633e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.8221108193029451e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 5.4321917643149696e+07, - "cpu_time": 9.4597465399999693e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9415681118512802e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2672623445590340e+07, - "cpu_time": 9.4137361133333191e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.1182378742756453e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time_median", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4310600956281021e+07, - "cpu_time": 9.4597465399999693e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9425977852111282e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6708868214525143e+06, - "cpu_time": 1.0897794363138289e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9348847603635335e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.9692500227266252e-02, - "cpu_time": 1.1576481677346996e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.6879677283862372e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 9.8979412578046322e+07, - "cpu_time": 1.7097006399999869e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4240664600496750e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 1.0547426249831915e+08, - "cpu_time": 1.7943084687500033e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0900655693947668e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 9.9149235524237156e+07, - "cpu_time": 1.7134094625000173e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4147761115995817e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 1.0562058165669441e+08, - "cpu_time": 1.7982337724999908e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0830141585948391e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 9.8844932392239571e+07, - "cpu_time": 1.7151549749999973e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4314459933016291e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0161368492990732e+08, - "cpu_time": 1.7461614637499991e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.2886736585880985e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time_median", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.9149235524237156e+07, - "cpu_time": 1.7151549749999970e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4147761115995817e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5929852787266038e+06, - "cpu_time": 4.5807060121874809e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8463340836179870e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.5359265646207290e-02, - "cpu_time": 2.6233003689991572e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4911098751948658e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.8292541056871414e+08, - "cpu_time": 3.1230585424999899e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8698341617041740e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8355449289083481e+08, - "cpu_time": 3.1407167049999887e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8497169265074072e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.8357677012681961e+08, - "cpu_time": 3.1400849925000787e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8490070571468887e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8293696641921997e+08, - "cpu_time": 3.1246936350000000e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8694633731894503e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8394868820905685e+08, - "cpu_time": 3.1365027200000381e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8371811968547297e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8338846564292911e+08, - "cpu_time": 3.1330113190000188e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8550405430805302e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time_median", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8355449289083481e+08, - "cpu_time": 3.1365027200000381e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8497169265074072e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4585437646018929e+05, - "cpu_time": 8.5123636306110187e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4235249153742269e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4312018473849968e-03, - "cpu_time": 2.7169910236162051e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4312810558699623e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8614930960069911e+06, - "cpu_time": 2.0739697730871171e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2003842016852782e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8582981641390200e+06, - "cpu_time": 2.0699264564643695e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2041672746836855e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8537218814087899e+06, - "cpu_time": 2.0705608680738846e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2096087018658514e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8579207630012501e+06, - "cpu_time": 2.0697414432718228e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2046150091909189e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8541964087288182e+06, - "cpu_time": 2.0712860580475368e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2090432171681831e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8571260626569740e+06, - "cpu_time": 2.0710969197889466e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2055636809187839e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time_median", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8579207630012501e+06, - "cpu_time": 2.0705608680738849e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2046150091909189e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2112175616108557e+03, - "cpu_time": 1.7163705729655067e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8126860780025586e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7291327854268518e-03, - "cpu_time": 8.2872537570111008e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7286674200285557e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 380, - "real_time": 1.8623628774596576e+06, - "cpu_time": 2.0757418394735719e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3987131074982760e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 380, - "real_time": 1.8585401155992018e+06, - "cpu_time": 2.0711783552630586e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4077606564649595e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 380, - "real_time": 1.8532361039864267e+06, - "cpu_time": 2.0715131921051759e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4203757861065278e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 380, - "real_time": 1.8581375895193655e+06, - "cpu_time": 2.0709094026314965e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4087155042802729e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 380, - "real_time": 1.8538765233020775e+06, - "cpu_time": 2.0720048289474023e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4188487728452478e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8572306419733458e+06, - "cpu_time": 2.0722695236841410e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4108827654390577e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time_median", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8581375895193655e+06, - "cpu_time": 2.0715131921051755e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4087155042802729e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7444479534340185e+03, - "cpu_time": 1.9836617343068106e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8898801332852454e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0161459049886587e-03, - "cpu_time": 9.5724118491121715e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0154423969144758e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8599496800040873e+06, - "cpu_time": 2.0743481846965980e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8088404628043473e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8539313016876169e+06, - "cpu_time": 2.0740189155673166e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8374364169188980e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8548030863297333e+06, - "cpu_time": 2.0744920976254449e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8332826922455169e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8589977068987205e+06, - "cpu_time": 2.0738731002638203e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8133513770345990e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8547414450311547e+06, - "cpu_time": 2.0747163693931666e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8335762614744361e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8564846439902626e+06, - "cpu_time": 2.0742897335092698e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8252974420955610e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time_median", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8548030863297333e+06, - "cpu_time": 2.0743481846965980e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8332826922455169e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7707352566440818e+03, - "cpu_time": 3.4398821412745860e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3164330762103424e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4924633314977287e-03, - "cpu_time": 1.6583421716382003e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4916585926397470e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8616551092752416e+06, - "cpu_time": 2.0792250422163433e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7601541680164840e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8574482774992269e+06, - "cpu_time": 2.0796813350922444e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7641406437500998e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8620903701526064e+06, - "cpu_time": 2.0795567968338637e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7597427345760088e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8658995648552994e+06, - "cpu_time": 2.0837219762533479e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7561502568087664e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8570007548286915e+06, - "cpu_time": 2.0796031398416767e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7645657878595129e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8608188153222133e+06, - "cpu_time": 2.0803576580474954e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7609507182021748e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time_median", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8616551092752418e+06, - "cpu_time": 2.0796031398416769e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7601541680164840e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6765597446994498e+03, - "cpu_time": 1.8887525480084423e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4778765019045743e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9757752417517488e-03, - "cpu_time": 9.0789799566537866e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9749993375483429e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8630398779774266e+06, - "cpu_time": 2.0856138915343350e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5176917453397669e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8582286098708643e+06, - "cpu_time": 2.0867081693121349e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5267996441274442e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8634133773274403e+06, - "cpu_time": 2.0864037857143586e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5169866652987950e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8697021441959478e+06, - "cpu_time": 2.0924977883597931e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5051572360571526e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8586250096237687e+06, - "cpu_time": 2.0870497037036191e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5260474630794995e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8626018037990897e+06, - "cpu_time": 2.0876546677248483e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5185365507805318e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time_median", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8630398779774266e+06, - "cpu_time": 2.0867081693121349e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5176917453397669e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6423353868145196e+03, - "cpu_time": 2.7589459699769623e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7580594158323685e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4923928331571977e-03, - "cpu_time": 1.3215528471400377e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4891199194419429e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8612166646576799e+06, - "cpu_time": 2.0994626200526822e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0422752218429729e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8586291872286841e+06, - "cpu_time": 2.1000012031662972e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0520790753014803e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8663992168440786e+06, - "cpu_time": 2.1038825778364874e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0227204778638706e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8573637392035855e+06, - "cpu_time": 2.0992380316623184e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0568837559089020e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8616440052232314e+06, - "cpu_time": 2.0994431688654255e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0406586668691814e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8610505626314520e+06, - "cpu_time": 2.1004055203166427e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0429234395572826e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time_median", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8612166646576799e+06, - "cpu_time": 2.0994626200526827e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0422752218429729e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4800715403122726e+03, - "cpu_time": 1.9641545466715093e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3156986178452877e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8699500218798939e-03, - "cpu_time": 9.3513111047975475e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8681143265813951e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 380, - "real_time": 1.8639245628468127e+06, - "cpu_time": 2.1245473421052005e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4064088495063433e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 380, - "real_time": 1.8697506900934968e+06, - "cpu_time": 2.1283672473683017e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4020264914938551e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 380, - "real_time": 1.8650634839631445e+06, - "cpu_time": 2.1230272578947050e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4055500107854787e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 380, - "real_time": 1.8616714687883167e+06, - "cpu_time": 2.1233943105262127e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4081109604726255e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 380, - "real_time": 1.8617283248443673e+06, - "cpu_time": 2.1233773842105186e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4080679576162875e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8644277061072276e+06, - "cpu_time": 2.1245427084209877e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4060328539749178e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time_median", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8639245628468127e+06, - "cpu_time": 2.1233943105262131e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4064088495063433e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3119114004894595e+03, - "cpu_time": 2.2136230577013457e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4942746422557402e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7763689037878863e-03, - "cpu_time": 1.0419291873621898e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7739803413585353e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 369, - "real_time": 1.8965110043079534e+06, - "cpu_time": 2.1911352439024467e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7644869911594075e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 369, - "real_time": 1.8947917559792395e+06, - "cpu_time": 2.1898564715446029e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7669953616039711e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 369, - "real_time": 1.8935481432306664e+06, - "cpu_time": 2.1877738915987918e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7688126223476368e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 369, - "real_time": 1.8920101629043892e+06, - "cpu_time": 2.1880566747967508e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7710633392961025e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 369, - "real_time": 1.8893850678300390e+06, - "cpu_time": 2.1855891978320205e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7749134304429823e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8932492268504580e+06, - "cpu_time": 2.1884822959349230e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7692543489700198e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time_median", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8935481432306662e+06, - "cpu_time": 2.1880566747967508e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7688126223476368e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7191424979458152e+03, - "cpu_time": 2.1201119198554420e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9788030845971755e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4362306131608909e-03, - "cpu_time": 9.6875899969285661e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4367777687437878e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 372, - "real_time": 1.8860565413037436e+06, - "cpu_time": 2.2678474704300682e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5596212363557673e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 372, - "real_time": 1.8875528913540815e+06, - "cpu_time": 2.2664451854838426e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5552138687238514e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 372, - "real_time": 1.8865735257878117e+06, - "cpu_time": 2.2677685026881699e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5580977134836364e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 372, - "real_time": 1.8874002232996156e+06, - "cpu_time": 2.2671739193548723e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5556632189374483e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 372, - "real_time": 1.8850802139583125e+06, - "cpu_time": 2.2654003252688241e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5625006948547220e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8865326791407131e+06, - "cpu_time": 2.2669270806451556e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5582193464710844e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time_median", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8865735257878122e+06, - "cpu_time": 2.2671739193548718e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5580977134836364e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0163041645023334e+03, - "cpu_time": 1.0221598064346583e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9948588574422000e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.3871537754927434e-04, - "cpu_time": 4.5090105242545203e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3881624145395363e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 365, - "real_time": 1.9295984689363162e+06, - "cpu_time": 2.4687249452054631e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0868333665065804e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 365, - "real_time": 1.9302401965968821e+06, - "cpu_time": 2.4685210849315496e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0864720378828461e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 365, - "real_time": 1.9319883860290458e+06, - "cpu_time": 2.4706322219178020e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0854889269341969e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 365, - "real_time": 1.9322855874883293e+06, - "cpu_time": 2.4700561260274672e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0853219697850003e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 365, - "real_time": 1.9301783799015188e+06, - "cpu_time": 2.4701498383561336e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0865068336880865e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9308582037904183e+06, - "cpu_time": 2.4696168432876831e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0861246269593420e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time_median", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9302401965968818e+06, - "cpu_time": 2.4700561260274672e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0864720378828461e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1985158974657877e+03, - "cpu_time": 9.3597748308502253e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7406623199801368e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.2071668189461651e-04, - "cpu_time": 3.7899704386490997e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2061591760891608e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 347, - "real_time": 2.0247974472592778e+06, - "cpu_time": 2.8868662507204688e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0714684353624210e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 347, - "real_time": 2.0209131423539622e+06, - "cpu_time": 2.8857238213255391e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0754499102888064e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 347, - "real_time": 2.0248200254573859e+06, - "cpu_time": 2.8886633141210843e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0714453370010254e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 347, - "real_time": 2.0287674806424300e+06, - "cpu_time": 2.8859885821325746e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0674148417796161e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 347, - "real_time": 2.0285526106686946e+06, - "cpu_time": 2.8860097146973731e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0676338281497095e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0255701412763502e+06, - "cpu_time": 2.8866503365994082e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0706824705163159e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time_median", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0248200254573859e+06, - "cpu_time": 2.8860097146973731e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0714453370010254e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2390381072339746e+03, - "cpu_time": 1.2047243820984947e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3128464284599731e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5990747697302624e-03, - "cpu_time": 4.1734337090432270e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5998814282877126e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 340, - "real_time": 2.0682839779457187e+06, - "cpu_time": 3.6422773176470250e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0558299002692151e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 340, - "real_time": 2.0627150192226775e+06, - "cpu_time": 3.6402054911765363e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0667799098884726e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 340, - "real_time": 2.0673047110904006e+06, - "cpu_time": 3.6409371264707102e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0577511167066536e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 340, - "real_time": 2.0613211508402054e+06, - "cpu_time": 3.6403527705882718e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0695298724222374e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 340, - "real_time": 2.0684482372256324e+06, - "cpu_time": 3.6409476764706527e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0555078193551846e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0656146192649272e+06, - "cpu_time": 3.6409440764706396e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0610797237283525e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time_median", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0673047110904008e+06, - "cpu_time": 3.6409371264707097e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0577511167066536e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3486127131336807e+03, - "cpu_time": 8.1742647343152566e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5875550209891982e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6211217145264605e-03, - "cpu_time": 2.2450948332716509e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6221191084969310e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 190, - "real_time": 3.6918336121169361e+06, - "cpu_time": 6.7958967052633353e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5444128210262890e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 190, - "real_time": 3.6965670676803901e+06, - "cpu_time": 6.7971149421052095e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5385936986469355e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 190, - "real_time": 3.6937796964163058e+06, - "cpu_time": 6.7927384631577516e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5420185768732243e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 190, - "real_time": 3.6935919344327166e+06, - "cpu_time": 6.7973121000001784e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5422494682203550e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 190, - "real_time": 3.6944508417754583e+06, - "cpu_time": 6.7886599631579332e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5411934597395544e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6940446304843621e+06, - "cpu_time": 6.7943444347368823e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5416936049012718e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time_median", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6937796964163058e+06, - "cpu_time": 6.7958967052633343e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5420185768732243e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7096361465518899e+03, - "cpu_time": 3.6669010690414457e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1016833213783661e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6280874151965047e-04, - "cpu_time": 5.3969902530904732e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6275321591713865e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 96, - "real_time": 7.4275628673300771e+06, - "cpu_time": 1.3940494541666718e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5175561081533499e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 96, - "real_time": 7.4316029398081200e+06, - "cpu_time": 1.3929907906250112e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5151002107852602e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 96, - "real_time": 7.4237279137984542e+06, - "cpu_time": 1.3937892781250127e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5198897898227806e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 96, - "real_time": 7.4253645580029115e+06, - "cpu_time": 1.3928573624999886e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5188935489821434e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 96, - "real_time": 7.4166796063461034e+06, - "cpu_time": 1.3941492864583202e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5241851854149199e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4249875770571334e+06, - "cpu_time": 1.3935672343750011e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5191249686316910e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time_median", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4253645580029115e+06, - "cpu_time": 1.3937892781250129e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5188935489821434e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5033259883205019e+03, - "cpu_time": 6.0349595167781536e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3505335140541424e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.4118992539806043e-04, - "cpu_time": 4.3305836761329733e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4141200726047260e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49, - "real_time": 1.3907604907848397e+07, - "cpu_time": 2.5790038448979065e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.8253358104909096e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49, - "real_time": 1.4560561075958671e+07, - "cpu_time": 2.6734471714286085e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6089476669141016e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49, - "real_time": 1.4544796084566992e+07, - "cpu_time": 2.6761264244897828e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6139432694561472e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49, - "real_time": 1.4533648115335679e+07, - "cpu_time": 2.6762006857142974e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6174823738293056e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49, - "real_time": 1.4528139608398993e+07, - "cpu_time": 2.6756905448978938e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6192331440154314e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4414949958421748e+07, - "cpu_time": 2.6560937342856981e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6569884529411783e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time_median", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4533648115335679e+07, - "cpu_time": 2.6756905448978938e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6174823738293056e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8388499594164902e+05, - "cpu_time": 4.3109239106069022e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4191070935944661e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9693789902877384e-02, - "cpu_time": 1.6230315425092616e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0225747151349952e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 25, - "real_time": 2.8250244781374931e+07, - "cpu_time": 5.0926624999999598e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7510288508540020e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 25, - "real_time": 2.8210705146193504e+07, - "cpu_time": 5.0918302199997924e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7576878105122490e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 25, - "real_time": 2.8256638273596764e+07, - "cpu_time": 5.0917501080000423e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7499538586447544e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 25, - "real_time": 2.5656550377607346e+07, - "cpu_time": 4.8216757920001782e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2313240098381748e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 25, - "real_time": 2.8195153325796127e+07, - "cpu_time": 5.0973466840000585e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7603120454465618e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7713858380913734e+07, - "cpu_time": 5.0390530608000070e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8500613150591497e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time_median", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8210705146193504e+07, - "cpu_time": 5.0918302199997917e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7576878105122490e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1503627835499351e+06, - "cpu_time": 1.2153950261621033e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1317713876297036e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1508575519826514e-02, - "cpu_time": 2.4119512366657749e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3953493557095477e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.4916159436106682e+07, - "cpu_time": 9.5273730099995643e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8880959403637228e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.4751246422529221e+07, - "cpu_time": 9.5207077999998540e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9028190870471821e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.2524373307824135e+07, - "cpu_time": 9.3036697299999103e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.1106836520791636e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.4848048090934753e+07, - "cpu_time": 9.5306631799996927e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8941660705035524e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.4966976121068001e+07, - "cpu_time": 9.5487843899996966e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8835769209635096e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4401360675692558e+07, - "cpu_time": 9.4862396219997436e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9358683341914253e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time_median", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4848048090934753e+07, - "cpu_time": 9.5273730099995643e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8941660705035524e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0523746787246561e+06, - "cpu_time": 1.0258786097457698e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7990204116452381e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9344638914424703e-02, - "cpu_time": 1.0814386423115777e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9852677883982647e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.0733332578092813e+08, - "cpu_time": 1.8380291100000080e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0019032587863369e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 9.7974468953907490e+07, - "cpu_time": 1.7467051412499756e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4797021890730867e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.0764140449464321e+08, - "cpu_time": 1.8396626250000027e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.9875873927928677e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 9.8030170425772667e+07, - "cpu_time": 1.7461907624999639e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4765885815378904e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.0734210442751646e+08, - "cpu_time": 1.8381613212500268e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0014941933854666e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0366429481655359e+08, - "cpu_time": 1.8017497919999957e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1894551231151304e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time_median", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0733332578092813e+08, - "cpu_time": 1.8380291100000077e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0019032587863369e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1701776841231920e+06, - "cpu_time": 5.0487846602264177e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6360224567825699e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.9874237733179408e-02, - "cpu_time": 2.8021563719022924e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0795746263245768e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.9336525723338127e+08, - "cpu_time": 3.1322833524998826e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5529201024155674e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.9433301687240601e+08, - "cpu_time": 3.1428466500000238e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5252670970728092e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.9411337375640869e+08, - "cpu_time": 3.1301560374998873e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5315190459129829e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.9396562129259109e+08, - "cpu_time": 3.1196299350000346e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5357326563571482e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.9358805567026138e+08, - "cpu_time": 3.1243790950000519e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5465293056556387e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9387306496500969e+08, - "cpu_time": 3.1298590139999759e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5383936414828300e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time_median", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9396562129259109e+08, - "cpu_time": 3.1301560374998868e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5357326563571482e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9273710560644453e+05, - "cpu_time": 8.7935757577041106e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1223348129894216e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0257435228422573e-03, - "cpu_time": 2.8095756768500174e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0264626995507881e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 381, - "real_time": 1.8504813195350140e+06, - "cpu_time": 2.0678760629921700e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2134781674149707e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 381, - "real_time": 1.8534999333286604e+06, - "cpu_time": 2.0680929028871467e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2098732923308406e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 381, - "real_time": 1.8575889615241496e+06, - "cpu_time": 2.0725746456692948e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2050087962620305e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 381, - "real_time": 1.8581500223795322e+06, - "cpu_time": 2.0725092204725235e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2043430028080805e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 381, - "real_time": 1.8530497355901469e+06, - "cpu_time": 2.0674294278215377e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2104101802186831e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8545539944715009e+06, - "cpu_time": 2.0696964519685346e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2086226878069211e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time_median", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8534999333286602e+06, - "cpu_time": 2.0680929028871465e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2098732923308406e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2443397841836686e+03, - "cpu_time": 2.6086514621199281e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8636362020962115e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7493908475327087e-03, - "cpu_time": 1.2604029250950213e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7493418968418984e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 380, - "real_time": 1.8496196565377575e+06, - "cpu_time": 2.0702376421052362e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4290186747551858e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 380, - "real_time": 1.8533358911602255e+06, - "cpu_time": 2.0689556315789418e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4201377845608136e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 380, - "real_time": 1.8599131179814178e+06, - "cpu_time": 2.0753212078948249e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4045068131412817e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 380, - "real_time": 1.8581607345703035e+06, - "cpu_time": 2.0737690578946993e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4086605897925114e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 380, - "real_time": 1.8526504065352797e+06, - "cpu_time": 2.0686603394735630e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4217732450237097e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8547359613569968e+06, - "cpu_time": 2.0713887757894532e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4168194214547006e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time_median", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8533358911602255e+06, - "cpu_time": 2.0702376421052362e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4201377845608136e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2136187757805164e+03, - "cpu_time": 2.9924667668009606e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0031706488834539e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2718159692647947e-03, - "cpu_time": 1.4446668832896730e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2712512175855604e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 380, - "real_time": 1.8502676378327457e+06, - "cpu_time": 2.0717495842105611e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8549351807238515e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 380, - "real_time": 1.8549350179359624e+06, - "cpu_time": 2.0719598999999347e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8326544280947000e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 380, - "real_time": 1.8590845058880451e+06, - "cpu_time": 2.0761745947368126e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8129398895580117e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 380, - "real_time": 1.8541636607742952e+06, - "cpu_time": 2.0695674368421410e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8363289318042565e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 380, - "real_time": 1.8507021717500479e+06, - "cpu_time": 2.0698129500000339e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8528560943477340e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8538305988362194e+06, - "cpu_time": 2.0718528931578968e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8379429049057104e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time_median", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8541636607742955e+06, - "cpu_time": 2.0717495842105609e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8363289318042565e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5852460953906002e+03, - "cpu_time": 2.6497125502306067e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7079697959355501e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9339664032092861e-03, - "cpu_time": 1.2789095977716555e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9325422378407772e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8533583664265277e+06, - "cpu_time": 2.0752989155671864e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7680336730116688e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8579734733594228e+06, - "cpu_time": 2.0749868258575299e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7636419717420299e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8651177554345555e+06, - "cpu_time": 2.0817664591029736e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7568863898550656e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8597398110732036e+06, - "cpu_time": 2.0769731899735963e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7619669055259138e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8551331479371141e+06, - "cpu_time": 2.0774786279683411e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7663422184244633e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8582645108461652e+06, - "cpu_time": 2.0773008036939255e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7633742317118283e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time_median", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8579734733594228e+06, - "cpu_time": 2.0769731899735965e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7636419717420299e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5580659741454074e+03, - "cpu_time": 2.7130739001951306e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3204074469675310e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4528617683549701e-03, - "cpu_time": 1.3060573102223094e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4500797217465375e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8591918322699401e+06, - "cpu_time": 2.0870676728231404e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5249724564455107e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8614365036662612e+06, - "cpu_time": 2.0845807915566603e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5207217582185119e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8667608352587188e+06, - "cpu_time": 2.0900179604221992e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5106800379662566e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8611359189213486e+06, - "cpu_time": 2.0842849841688913e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5212903761474036e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8541161442423698e+06, - "cpu_time": 2.0827167651714443e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5346221542544939e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8605282468717278e+06, - "cpu_time": 2.0857336348284674e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5224573566064350e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time_median", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8611359189213484e+06, - "cpu_time": 2.0845807915566601e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5212903761474036e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5535814981671010e+03, - "cpu_time": 2.8576319757275801e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6224620691757751e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4474670061169156e-03, - "cpu_time": 1.3700848123699143e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4478542097902721e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8573123110073686e+06, - "cpu_time": 2.0988705593667706e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0570791580501184e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8650687662967527e+06, - "cpu_time": 2.1026983509233827e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0277301496102065e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8596718064217526e+06, - "cpu_time": 2.0965262427440372e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0481253491818726e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8647491946428802e+06, - "cpu_time": 2.1011996807387588e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0289345278468788e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8563531971543336e+06, - "cpu_time": 2.0970605699208400e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0607253081431210e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8606310551046177e+06, - "cpu_time": 2.0992710807387577e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0445188985664397e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time_median", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8596718064217526e+06, - "cpu_time": 2.0988705593667706e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0481253491818726e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0892127279724627e+03, - "cpu_time": 2.6479515638581188e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5476991131192134e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1977558187872654e-03, - "cpu_time": 1.2613671422207530e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1970259934062644e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8605822996404539e+06, - "cpu_time": 2.1202308359788815e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4089352567239714e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8677277225328402e+06, - "cpu_time": 2.1238942936508558e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4035450501559427e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8696075203479268e+06, - "cpu_time": 2.1260318227513423e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4021338550842801e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8729192813259067e+06, - "cpu_time": 2.1296740026454423e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3996545532620010e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8682238037134989e+06, - "cpu_time": 2.1251334179894566e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4031723580383256e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8678121255121254e+06, - "cpu_time": 2.1249928746031956e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4034882146529040e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time_median", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8682238037134986e+06, - "cpu_time": 2.1251334179894566e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4031723580383256e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5208812209660682e+03, - "cpu_time": 3.4240333457698325e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4023709565536794e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4204153936127344e-03, - "cpu_time": 1.6113152127200472e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4242248143103349e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 372, - "real_time": 1.8981340258652645e+06, - "cpu_time": 2.1937296774193104e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7621231844311064e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 372, - "real_time": 1.8935422392709742e+06, - "cpu_time": 2.1903093897849103e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7688212553518438e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 372, - "real_time": 1.8921822297915076e+06, - "cpu_time": 2.1885848333332976e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7708113507533008e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 372, - "real_time": 1.8900187679200922e+06, - "cpu_time": 2.1860198064516876e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7739830360360008e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 372, - "real_time": 1.8888032625577042e+06, - "cpu_time": 2.1859093602149482e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7757681829183239e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8925361050811086e+06, - "cpu_time": 2.1889106134408312e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7703014018981153e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time_median", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8921822297915076e+06, - "cpu_time": 2.1885848333332976e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7708113507533008e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6312997164066705e+03, - "cpu_time": 3.2653625961898151e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3097609931144735e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9187479206643951e-03, - "cpu_time": 1.4917752128109374e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9166726730443148e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 371, - "real_time": 1.8875228523965823e+06, - "cpu_time": 2.2691417088948111e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5553022771015775e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 371, - "real_time": 1.8938452286540337e+06, - "cpu_time": 2.2721630943396292e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5367565634982157e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 371, - "real_time": 1.8886656962765625e+06, - "cpu_time": 2.2697946873315927e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5519407276111937e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 371, - "real_time": 1.8929680459505082e+06, - "cpu_time": 2.2715049838275644e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5393222418262362e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 371, - "real_time": 1.8892341100101201e+06, - "cpu_time": 2.2704819056603550e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5502703155956841e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8904471866575617e+06, - "cpu_time": 2.2706172760107908e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5467184251265812e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time_median", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8892341100101203e+06, - "cpu_time": 2.2704819056603555e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5502703155956841e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7882976339404113e+03, - "cpu_time": 1.2298226550484906e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1779138288441265e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4749407725429822e-03, - "cpu_time": 5.4162481191420567e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4743697447842773e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 363, - "real_time": 1.9346682493351707e+06, - "cpu_time": 2.4699820275481977e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0839853296401930e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 363, - "real_time": 1.9326389344863226e+06, - "cpu_time": 2.4694064573003626e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0851235388970385e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 363, - "real_time": 1.9328337478305190e+06, - "cpu_time": 2.4692152975207181e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0850141675940404e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 363, - "real_time": 1.9321390700246880e+06, - "cpu_time": 2.4704799311295459e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0854042716362045e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 363, - "real_time": 1.9326988750678739e+06, - "cpu_time": 2.4691993471073695e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0850898849549706e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9329957753489148e+06, - "cpu_time": 2.4696566121212384e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0849234385444894e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time_median", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9326988750678736e+06, - "cpu_time": 2.4694064573003622e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0850898849549706e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7119145138014972e+02, - "cpu_time": 5.5905650371350498e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4479929720953200e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.0242812931386015e-04, - "cpu_time": 2.2637013622445266e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0215460174814121e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 346, - "real_time": 2.0266216742197815e+06, - "cpu_time": 2.8861040375722703e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0696038403984518e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 346, - "real_time": 2.0234231168210420e+06, - "cpu_time": 2.8843423208092838e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0728753986905041e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 346, - "real_time": 2.0310651938931618e+06, - "cpu_time": 2.8853202543353089e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0650760067235088e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 346, - "real_time": 2.0290480824348899e+06, - "cpu_time": 2.8846203901734939e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0671289341585088e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 346, - "real_time": 2.0275683030539940e+06, - "cpu_time": 2.8850381676301565e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0686375860593171e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0275452740845743e+06, - "cpu_time": 2.8850850341041023e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0686643532060583e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time_median", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0275683030539942e+06, - "cpu_time": 2.8850381676301570e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0686375860593171e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8501761324854606e+03, - "cpu_time": 6.8253390169087243e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9090375928268787e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4057274917189209e-03, - "cpu_time": 2.3657323566645503e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4062395324395630e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 340, - "real_time": 2.0660219135392897e+06, - "cpu_time": 3.6426908617647099e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0602705833015714e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 340, - "real_time": 2.0712384159731513e+06, - "cpu_time": 3.6430231294116643e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0500446183829074e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 340, - "real_time": 2.0693565160720882e+06, - "cpu_time": 3.6421347882353798e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0537277819689980e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 340, - "real_time": 2.0645776931333409e+06, - "cpu_time": 3.6422950882352469e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0631108375819407e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 340, - "real_time": 2.0723763058948165e+06, - "cpu_time": 3.6422569617647748e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0478208403265557e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0687141689225375e+06, - "cpu_time": 3.6424801658823555e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0549949323123951e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time_median", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0693565160720882e+06, - "cpu_time": 3.6422950882352469e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0537277819689980e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3374522931381775e+03, - "cpu_time": 3.6829392824613694e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5436856110299183e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6132979332163829e-03, - "cpu_time": 1.0111075736137090e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6137345965308830e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 191, - "real_time": 3.6572477833918878e+06, - "cpu_time": 6.7295950418849112e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5873883842893724e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 191, - "real_time": 3.5219391971260933e+06, - "cpu_time": 6.8215138115184195e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7636302221487036e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 191, - "real_time": 3.6553445269709639e+06, - "cpu_time": 6.7229219947642796e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5897769351724005e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 191, - "real_time": 3.6582161321338871e+06, - "cpu_time": 6.7224092041885853e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5861740788436203e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 191, - "real_time": 3.6588235190186980e+06, - "cpu_time": 6.7155260261781663e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5854127461440592e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6303142317283065e+06, - "cpu_time": 6.7423932157068728e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6224764733196316e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time_median", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6572477833918878e+06, - "cpu_time": 6.7229219947642786e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5873883842893724e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.0597804246986590e+04, - "cpu_time": 4.4508979344858082e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8924644934521690e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6692165024551446e-02, - "cpu_time": 6.6013621455911723e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7074104192863950e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 97, - "real_time": 7.3288212213473218e+06, - "cpu_time": 1.3708855391752252e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5784214113809958e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 97, - "real_time": 7.3328657344598128e+06, - "cpu_time": 1.3747849896906974e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5758961387108831e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 97, - "real_time": 7.3367700691229291e+06, - "cpu_time": 1.3779734876288315e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5734610303810778e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 97, - "real_time": 7.3299246801773915e+06, - "cpu_time": 1.3732899247422455e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5777321683458214e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 97, - "real_time": 7.3262990797994677e+06, - "cpu_time": 1.3740817113402275e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5799975723784456e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3309361569813844e+06, - "cpu_time": 1.3742031305154458e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5771016642394447e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time_median", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3299246801773906e+06, - "cpu_time": 1.3740817113402274e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5777321683458214e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0235656750018934e+03, - "cpu_time": 2.5694966705673625e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5116258972386792e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.4884745806579936e-04, - "cpu_time": 1.8698084828285744e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4873718817779950e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49, - "real_time": 1.4480136562975086e+07, - "cpu_time": 2.6740455591837008e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6345463461714640e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49, - "real_time": 1.4497214187012643e+07, - "cpu_time": 2.6736946959183153e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6290868807139235e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49, - "real_time": 1.4493086736421196e+07, - "cpu_time": 2.6741884999999423e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6304051870023727e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49, - "real_time": 1.4492231250113370e+07, - "cpu_time": 2.6740318183673322e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6306785229827890e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49, - "real_time": 1.4498530221836908e+07, - "cpu_time": 2.6738624816326424e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6286666974645634e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4492239791671842e+07, - "cpu_time": 2.6739646110203870e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6306767268670225e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time_median", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4493086736421194e+07, - "cpu_time": 2.6740318183673322e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6304051870023727e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2718576316434455e+03, - "cpu_time": 1.9005281235908449e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3246246827219226e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.0177596673650919e-04, - "cpu_time": 7.1075290815670217e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0200539140090098e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 25, - "real_time": 2.6911565512418747e+07, - "cpu_time": 4.9607792200001761e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9873623271029406e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 25, - "real_time": 2.8028734177350998e+07, - "cpu_time": 5.0557589640000060e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7885761501301212e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 25, - "real_time": 2.8049841448664665e+07, - "cpu_time": 5.0590910240000546e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7849727865891218e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 25, - "real_time": 2.8060932382941246e+07, - "cpu_time": 5.0570051880001754e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7830815515450735e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 25, - "real_time": 2.7969188168644905e+07, - "cpu_time": 5.0426689639998585e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7987709614848928e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7804052338004112e+07, - "cpu_time": 5.0350606720000550e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8285527553704309e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time_median", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8028734177350998e+07, - "cpu_time": 5.0557589640000068e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7885761501301212e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0017100819194072e+05, - "cpu_time": 4.2021004003387596e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8983718094542220e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7989140651568956e-02, - "cpu_time": 8.3456797724536218e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8428651938320943e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 14, - "real_time": 5.4892037596021377e+07, - "cpu_time": 9.6418511428571001e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8902439726423349e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 14, - "real_time": 5.4806699976325035e+07, - "cpu_time": 9.6393145214286894e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8978584026397619e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 14, - "real_time": 5.4894860567791119e+07, - "cpu_time": 9.6294117999998927e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8899924915284538e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 14, - "real_time": 4.9944533301251277e+07, - "cpu_time": 9.2230615714287624e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3746714256167612e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 14, - "real_time": 5.4967660989080153e+07, - "cpu_time": 9.6461495714286074e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8835160741754541e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3901158486093804e+07, - "cpu_time": 9.5559577214286119e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9872564733205528e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time_median", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4892037596021377e+07, - "cpu_time": 9.6393145214286894e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8902439726423349e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2125551445329115e+06, - "cpu_time": 1.8619610233616817e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1663110243037808e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1048378303478184e-02, - "cpu_time": 1.9484818556557194e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3436928417307452e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.0240637045353651e+08, - "cpu_time": 1.7761139387499726e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.2425538530690079e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 1.0681978613138199e+08, - "cpu_time": 1.8279985762499961e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0259500738906240e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.0262513160705566e+08, - "cpu_time": 1.7748506062500268e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.2313785482452831e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 1.0687274672091007e+08, - "cpu_time": 1.8277000650000730e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0234594737421408e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.0218540858477354e+08, - "cpu_time": 1.7695586899999681e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.2538901535497522e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0418188869953156e+08, - "cpu_time": 1.7952443752500075e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1554464204993620e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time_median", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0262513160705566e+08, - "cpu_time": 1.7761139387499726e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.2313785482452831e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4372684652928682e+06, - "cpu_time": 2.9865713292040741e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1961858061053625e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3394358613733093e-02, - "cpu_time": 1.6636015521776310e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3202371017745901e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.8502469733357430e+08, - "cpu_time": 3.1218213949998128e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8032351327898130e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8504615128040314e+08, - "cpu_time": 3.1210432125001830e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8025623152407169e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.8525071069598198e+08, - "cpu_time": 3.1442122625000477e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7961549511253185e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8533523008227348e+08, - "cpu_time": 3.1271788000000811e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7935117005188255e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8482182547450066e+08, - "cpu_time": 3.1368380250000882e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8096051223568354e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8509572297334674e+08, - "cpu_time": 3.1302187390000427e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8010138444063015e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time_median", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8504615128040314e+08, - "cpu_time": 3.1271788000000811e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8025623152407169e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0242695195027947e+05, - "cpu_time": 1.0044657149718512e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3449378974801637e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0936338706185470e-03, - "cpu_time": 3.2089313837943816e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0937636191987970e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 381, - "real_time": 1.8495616817090958e+06, - "cpu_time": 2.0681772860891975e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2145787515532179e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 381, - "real_time": 1.8512498740489676e+06, - "cpu_time": 2.0705354094489750e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2125592322345003e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 381, - "real_time": 1.8465863502001709e+06, - "cpu_time": 2.0662488635170530e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2181470146554434e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 381, - "real_time": 1.8458186856828802e+06, - "cpu_time": 2.0686705223096663e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2190695282102646e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 381, - "real_time": 1.8486293943348620e+06, - "cpu_time": 2.0676159711285145e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2156955918542794e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8483691971951958e+06, - "cpu_time": 2.0682496104986812e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2160100237015416e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time_median", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8486293943348620e+06, - "cpu_time": 2.0681772860891973e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2156955918542794e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2063359549073289e+03, - "cpu_time": 1.5661865910096374e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6449322893385279e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1936662644320892e-03, - "cpu_time": 7.5725221127057767e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1935561035597349e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 383, - "real_time": 1.8481950452996541e+06, - "cpu_time": 2.0683600496082415e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4324326162619935e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 383, - "real_time": 1.8488367260026431e+06, - "cpu_time": 2.0690741827675749e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4308942400294403e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 383, - "real_time": 1.8463945218585930e+06, - "cpu_time": 2.0668132036556138e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4367549313100642e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 383, - "real_time": 1.8456584475358506e+06, - "cpu_time": 2.0697940704960926e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4385243710379815e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 383, - "real_time": 1.8467078323823437e+06, - "cpu_time": 2.0669675926891123e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4360021960982950e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8471585146158170e+06, - "cpu_time": 2.0682018198433269e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4349216709475545e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time_median", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8467078323823437e+06, - "cpu_time": 2.0683600496082413e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4360021960982950e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3160347615585149e+03, - "cpu_time": 1.3012385887779933e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1592490856461841e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.1246444262648017e-04, - "cpu_time": 6.2916422193099440e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1235735826901010e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 382, - "real_time": 1.8479710401799860e+06, - "cpu_time": 2.0695845183243612e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8659398030416407e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 382, - "real_time": 1.8517645663707955e+06, - "cpu_time": 2.0735296178010770e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8477770325362645e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 382, - "real_time": 1.8475350066301774e+06, - "cpu_time": 2.0692768455497876e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8680322382002920e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 382, - "real_time": 1.8455697651644705e+06, - "cpu_time": 2.0719366518325571e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8774752974672392e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 382, - "real_time": 1.8475832122112005e+06, - "cpu_time": 2.0694609319370987e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8678008609915413e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8480847181113262e+06, - "cpu_time": 2.0707577130889762e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8654050464473963e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time_median", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8475832122112003e+06, - "cpu_time": 2.0695845183243614e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8678008609915413e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2601374454596225e+03, - "cpu_time": 1.8923760382356315e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0832426581543548e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2229620337802474e-03, - "cpu_time": 9.1385681013002209e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2218761043393488e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 381, - "real_time": 1.8521007619624936e+06, - "cpu_time": 2.0764239160105721e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7692341946492638e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 381, - "real_time": 1.8546653895544468e+06, - "cpu_time": 2.0794116194224742e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7667877011427909e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 381, - "real_time": 1.8528881365333421e+06, - "cpu_time": 2.0768805984251236e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7684823683585797e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 381, - "real_time": 1.8545784632114051e+06, - "cpu_time": 2.0825008845146156e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7668705126262832e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 381, - "real_time": 1.8552449394392984e+06, - "cpu_time": 2.0795172519684739e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7662357839339163e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8538955381401971e+06, - "cpu_time": 2.0789468540682520e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7675221121421669e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time_median", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8545784632114053e+06, - "cpu_time": 2.0794116194224742e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7668705126262832e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3337935786100929e+03, - "cpu_time": 2.4396271146504546e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2719964834488537e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.1945454917494241e-04, - "cpu_time": 1.1734918138366038e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1964954481233863e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 383, - "real_time": 1.8605728235214890e+06, - "cpu_time": 2.0899902219322724e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5223560814975582e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 383, - "real_time": 1.8601596820909549e+06, - "cpu_time": 2.0895257467364774e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5231383967172526e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 383, - "real_time": 1.8553675821103586e+06, - "cpu_time": 2.0850752271542058e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5322380660255536e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 383, - "real_time": 1.8569608926806506e+06, - "cpu_time": 2.0910815378592054e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5292073332462206e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 383, - "real_time": 1.8571960909551075e+06, - "cpu_time": 2.0867972819843392e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5287603888018392e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8580514142717118e+06, - "cpu_time": 2.0884940031333000e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5271400532576852e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time_median", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8571960909551072e+06, - "cpu_time": 2.0895257467364774e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5287603888018392e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2319312372104291e+03, - "cpu_time": 2.4781743968268952e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2364049875749603e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2012214624778099e-03, - "cpu_time": 1.1865843967514248e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2010878285545238e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8621184086024095e+06, - "cpu_time": 2.1051236147758691e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0388649505041152e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8590636181861339e+06, - "cpu_time": 2.1054835804748554e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0504311266058430e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8633887072915144e+06, - "cpu_time": 2.1064318469657614e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0340664557593405e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8594925387671567e+06, - "cpu_time": 2.1026614749341104e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0488048361248448e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8624025012279239e+06, - "cpu_time": 2.1062554221636294e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0377912354381651e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8612931548150280e+06, - "cpu_time": 2.1051911878628451e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0419917208864614e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time_median", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8621184086024095e+06, - "cpu_time": 2.1054835804748554e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0388649505041152e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9049990282405452e+03, - "cpu_time": 1.5133850076316312e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2088956591838665e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0234814560578238e-03, - "cpu_time": 7.1888245417177257e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0237012403468710e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8712539012440101e+06, - "cpu_time": 2.1344028488062485e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4009002189693582e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8695261634655287e+06, - "cpu_time": 2.1321779787799628e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4021948722775045e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8707581844618693e+06, - "cpu_time": 2.1338046392571265e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4012714319643974e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8696683047207159e+06, - "cpu_time": 2.1326897108754162e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4020882706205907e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8704543088591197e+06, - "cpu_time": 2.1331314137931149e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4014990837166950e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8703321725502487e+06, - "cpu_time": 2.1332413183023739e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4015907755097091e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time_median", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8704543088591197e+06, - "cpu_time": 2.1331314137931149e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4014990837166950e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3081433221272925e+02, - "cpu_time": 8.8225907515999074e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4765187665158235e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.9074039517603126e-04, - "cpu_time": 4.1357677989384224e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9073593107262044e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 372, - "real_time": 1.8951969635259781e+06, - "cpu_time": 2.1981687338708406e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7664037569191337e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 372, - "real_time": 1.8945780142413210e+06, - "cpu_time": 2.1953553897850313e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7673075273701501e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 372, - "real_time": 1.8965431878822653e+06, - "cpu_time": 2.1966292043010350e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7644400789282054e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 372, - "real_time": 1.8955212704034932e+06, - "cpu_time": 2.1978034247311330e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7659304497722495e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 372, - "real_time": 1.8950752369898011e+06, - "cpu_time": 2.1961613360215374e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7665814515775955e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8953829346085719e+06, - "cpu_time": 2.1968236177419159e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7661326529134673e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time_median", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8951969635259781e+06, - "cpu_time": 2.1966292043010350e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7664037569191337e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3186137980316005e+02, - "cpu_time": 1.1620527237127112e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0678179161261530e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8612850545386048e-04, - "cpu_time": 5.2896951504334652e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8603279383635453e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 369, - "real_time": 1.9068530537339489e+06, - "cpu_time": 2.2828953712736457e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4989869195568395e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 369, - "real_time": 1.9036304701919740e+06, - "cpu_time": 2.2819791246612854e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5082959451382124e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 369, - "real_time": 1.9089504382333297e+06, - "cpu_time": 2.2841993902439266e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4929451231349003e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 369, - "real_time": 1.9032467332691320e+06, - "cpu_time": 2.2810859024387635e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5094065402592468e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 369, - "real_time": 1.9102395282014650e+06, - "cpu_time": 2.2860943523035645e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4892383102723181e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9065840447259701e+06, - "cpu_time": 2.2832508281842372e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4997745676723039e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time_median", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9068530537339491e+06, - "cpu_time": 2.2828953712736457e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4989869195568395e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1183326395031604e+03, - "cpu_time": 1.9631532252816730e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9953208952210261e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6355600206186308e-03, - "cpu_time": 8.5980620308933687e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6355799286929971e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 360, - "real_time": 1.9717222640691844e+06, - "cpu_time": 2.4984514249998331e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0636143021847091e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 360, - "real_time": 1.9469878806072907e+06, - "cpu_time": 2.4731190305554187e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0771263760233941e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 360, - "real_time": 1.9475345771449308e+06, - "cpu_time": 2.4753228027776685e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0768240136071973e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 360, - "real_time": 1.9522927929453240e+06, - "cpu_time": 2.4792104861110905e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0741995296904898e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 360, - "real_time": 1.9450710056440181e+06, - "cpu_time": 2.4721600888887625e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0781878882131748e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9527217040821500e+06, - "cpu_time": 2.4796527666665548e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0739904219437931e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time_median", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9475345771449306e+06, - "cpu_time": 2.4753228027776685e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0768240136071973e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0948989093473192e+04, - "cpu_time": 1.0853152564406282e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9830961903549572e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.6070401996272242e-03, - "cpu_time": 4.3768840179169051e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5709027456001658e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 347, - "real_time": 2.0241023330501034e+06, - "cpu_time": 2.8906264755041040e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0721798159679198e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 347, - "real_time": 2.0251780773864614e+06, - "cpu_time": 2.8910917608070886e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0710791050102839e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 347, - "real_time": 2.0288488400230450e+06, - "cpu_time": 2.8909453746396652e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0673319358540082e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 347, - "real_time": 2.0296571988301077e+06, - "cpu_time": 2.8946594927956355e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0665085721951432e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 347, - "real_time": 2.0236352465977031e+06, - "cpu_time": 2.8887146772333337e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0726581072610781e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0262843391774842e+06, - "cpu_time": 2.8912075561959655e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0699515072576866e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time_median", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0251780773864612e+06, - "cpu_time": 2.8909453746396648e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0710791050102839e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7818835439853251e+03, - "cpu_time": 2.1534921815722578e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8407074895666395e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3728989017970481e-03, - "cpu_time": 7.4484177967688403e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3723546081183642e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 326, - "real_time": 2.1448431374430885e+06, - "cpu_time": 3.7328274386502234e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9110589737579746e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 326, - "real_time": 2.1490079973555780e+06, - "cpu_time": 3.7325350828219191e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9034791914792528e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 326, - "real_time": 2.1401525395093886e+06, - "cpu_time": 3.7305162331290515e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9196308885174212e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 326, - "real_time": 2.1458422990824366e+06, - "cpu_time": 3.7339174355829414e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9092378799630218e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 326, - "real_time": 2.1421480777479163e+06, - "cpu_time": 3.7363427791411802e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9159795194079742e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1443988102276819e+06, - "cpu_time": 3.7332277938650632e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9118772906251292e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time_median", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1448431374430889e+06, - "cpu_time": 3.7328274386502234e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9110589737579746e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4140263777429036e+03, - "cpu_time": 2.1313982194944720e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2271735495841131e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5920669054001286e-03, - "cpu_time": 5.7092637716805517e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5918632121993256e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 175, - "real_time": 4.0119184407272511e+06, - "cpu_time": 7.1580054171428336e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1818437358259830e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 175, - "real_time": 4.0125940540539366e+06, - "cpu_time": 7.1580851142860930e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1811396253877025e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 175, - "real_time": 4.0137771623475212e+06, - "cpu_time": 7.1583012342853183e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1799071850285730e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 175, - "real_time": 4.0174901512052333e+06, - "cpu_time": 7.1628068285709955e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1760440893593464e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 175, - "real_time": 4.0339318410094297e+06, - "cpu_time": 7.1775875999998925e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1590231717454500e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0179423298686752e+06, - "cpu_time": 7.1629572388570262e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1755915614694118e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time_median", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0137771623475207e+06, - "cpu_time": 7.1583012342853174e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1799071850285730e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1938681620416428e+03, - "cpu_time": 8.4262477574780605e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5290558771454375e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2882031167286913e-03, - "cpu_time": 1.1763643808688456e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2820852415441021e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 91, - "real_time": 7.8228838424515594e+06, - "cpu_time": 1.3974281736263299e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2892662956228442e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 91, - "real_time": 7.8336743146672351e+06, - "cpu_time": 1.3984357472527886e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2833580580666952e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 91, - "real_time": 7.9086180315813525e+06, - "cpu_time": 1.4067147978021938e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2427680621326823e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 91, - "real_time": 7.8443591636452042e+06, - "cpu_time": 1.3989186527472876e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2775236701945643e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 91, - "real_time": 7.8262473241640972e+06, - "cpu_time": 1.3970681681318916e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2874229001680408e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8471565353018893e+06, - "cpu_time": 1.3997131079120984e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2760677972369652e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time_median", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8336743146672351e+06, - "cpu_time": 1.3984357472527886e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2833580580666952e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5332243825365091e+04, - "cpu_time": 3.9844416707069919e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9152536054519776e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5025537169312776e-03, - "cpu_time": 2.8466131010592877e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4790066394399608e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 47, - "real_time": 1.5231551939344153e+07, - "cpu_time": 2.7221261744680885e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4059111157710171e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 47, - "real_time": 1.5242428538647104e+07, - "cpu_time": 2.7270055446808059e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4027671725569057e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 47, - "real_time": 1.5231613149034215e+07, - "cpu_time": 2.7250683787235387e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4058934101970110e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 47, - "real_time": 1.5246748527947893e+07, - "cpu_time": 2.7263369489361972e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4015196995599947e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 47, - "real_time": 1.5222166367667787e+07, - "cpu_time": 2.7242926234042354e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4086276801271000e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5234901704528231e+07, - "cpu_time": 2.7249659340425737e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4049438156424055e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time_median", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5231613149034213e+07, - "cpu_time": 2.7250683787235387e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4058934101970110e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7624892529542867e+03, - "cpu_time": 1.9083874051124250e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8227027375053153e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.4079765280353640e-04, - "cpu_time": 7.0033440832094058e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4080334634044808e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 24, - "real_time": 2.9973543404291075e+07, - "cpu_time": 5.2200686166666329e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4778732427339611e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 24, - "real_time": 3.0051517765969038e+07, - "cpu_time": 5.2276954708332829e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4662545514420223e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 24, - "real_time": 2.9974863864481449e+07, - "cpu_time": 5.2216589000001550e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4776759823433447e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 24, - "real_time": 2.9641681195547182e+07, - "cpu_time": 5.0824407041664205e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.5280065970132084e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 24, - "real_time": 3.0002350841338437e+07, - "cpu_time": 5.2257046583330669e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4735737112663002e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9928791414325438e+07, - "cpu_time": 5.1955136699999116e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4846768169597683e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time_median", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9974863864481449e+07, - "cpu_time": 5.2216589000001557e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4776759823433447e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6357753183593700e+05, - "cpu_time": 6.3283445981883770e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4675032775363844e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.4655575486299282e-03, - "cpu_time": 1.2180402170298754e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5020760207402037e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.8860427513718605e+07, - "cpu_time": 9.9357217800002217e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.5605420711128159e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.8955963328480721e+07, - "cpu_time": 9.9415354799998567e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.5531518924451694e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.9739521890878677e+07, - "cpu_time": 9.8037372099997804e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.4934316094850779e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.8992460742592812e+07, - "cpu_time": 9.9436392399991289e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.5503349516354122e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.9031324833631516e+07, - "cpu_time": 9.9351197500004679e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.5473391755400019e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9115939661860481e+07, - "cpu_time": 9.9119506919998914e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.5409599400436954e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time_median", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.8992460742592812e+07, - "cpu_time": 9.9357217800002217e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.5503349516354122e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5430932604611904e+05, - "cpu_time": 6.0604148610737780e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7016806131176941e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.9934651816878235e-03, - "cpu_time": 6.1142504128528863e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9495803724084325e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7, - "real_time": 1.1530271598270962e+08, - "cpu_time": 1.9039912242856511e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.6561861741444778e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7, - "real_time": 1.0935783705541065e+08, - "cpu_time": 1.8220304957143137e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.9093044125220966e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7, - "real_time": 1.1527188335146223e+08, - "cpu_time": 1.9057230757141498e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.6574315990230570e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7, - "real_time": 1.0945353763444082e+08, - "cpu_time": 1.8139612985714847e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.9050119676631384e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7, - "real_time": 1.1526573449373245e+08, - "cpu_time": 1.9055464842857161e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.6576800499995270e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1293034170355117e+08, - "cpu_time": 1.8702505157142633e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.7571228406704597e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time_median", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1526573449373245e+08, - "cpu_time": 1.9039912242856514e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.6576800499995270e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2177629064972671e+06, - "cpu_time": 4.7791708539718045e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3697248594233689e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8493342515017669e-02, - "cpu_time": 2.5553640080920398e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8793136214879046e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 2.1480339393019676e+08, - "cpu_time": 3.3517436725000495e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 4.9987190814542103e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 2.1480798721313477e+08, - "cpu_time": 3.3650692025000238e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 4.9986121928260612e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 2.1478202566504478e+08, - "cpu_time": 3.3651698900001746e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 4.9992163947392578e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 2.1454587206244469e+08, - "cpu_time": 3.3638314300000614e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.0047191012255030e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 2.1467530727386475e+08, - "cpu_time": 3.3635003825000352e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.0017015819626160e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1472291722893715e+08, - "cpu_time": 3.3618629155000693e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.0005936704415302e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time_median", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1478202566504478e+08, - "cpu_time": 3.3638314300000614e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 4.9992163947392578e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1271524707542386e+05, - "cpu_time": 5.7046424752515904e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6260175570471724e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.2493347487099886e-04, - "cpu_time": 1.6968694496584012e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2514115925265861e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 382, - "real_time": 1.8448775106910262e+06, - "cpu_time": 2.0675181020940046e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2202015994361504e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 382, - "real_time": 1.8389344356188562e+06, - "cpu_time": 2.0664143534032444e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2273768551305500e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 382, - "real_time": 1.8437989660471992e+06, - "cpu_time": 2.0665129397906144e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2215003237479562e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 382, - "real_time": 1.8478626551916299e+06, - "cpu_time": 2.0703016465966769e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2166149570110939e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 382, - "real_time": 1.8433717469390999e+06, - "cpu_time": 2.0659443089002657e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2220151777856890e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8437690628975625e+06, - "cpu_time": 2.0673382701569614e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2215417826222880e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time_median", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8437989660471990e+06, - "cpu_time": 2.0665129397906144e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2215003237479562e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2217436844457261e+03, - "cpu_time": 1.7529874368502794e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8840569822490274e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7473683387346881e-03, - "cpu_time": 8.4794417157342365e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7483609863345993e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 382, - "real_time": 1.8481717638892953e+06, - "cpu_time": 2.0719113141360320e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4324884515932351e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 382, - "real_time": 1.8387099324991615e+06, - "cpu_time": 2.0675085026178958e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4552976275412245e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 382, - "real_time": 1.8437792741440916e+06, - "cpu_time": 2.0671652617798678e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4430480995632419e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 382, - "real_time": 1.8491409866985588e+06, - "cpu_time": 2.0720075209424163e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4301651734116441e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 382, - "real_time": 1.8437311095522330e+06, - "cpu_time": 2.0668396544504084e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4431641672464395e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8447066133566680e+06, - "cpu_time": 2.0690864507853244e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4408327038711570e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time_median", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8437792741440919e+06, - "cpu_time": 2.0675085026178956e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4430480995632419e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1666137972816150e+03, - "cpu_time": 2.6335093123564347e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0037435784303849e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2586864312802318e-03, - "cpu_time": 1.2727884382776192e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2602598327007518e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 382, - "real_time": 1.8488121770314095e+06, - "cpu_time": 2.0743977905759250e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8619061490104254e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 382, - "real_time": 1.8449922438762125e+06, - "cpu_time": 2.0698568324606232e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8802541335232109e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 382, - "real_time": 1.8500260001838363e+06, - "cpu_time": 2.0746413612565061e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8560917513439972e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 382, - "real_time": 1.8506052820633668e+06, - "cpu_time": 2.0759172382199673e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8533195915945694e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 382, - "real_time": 1.8446818823805470e+06, - "cpu_time": 2.0702524738219059e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8817482062850762e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8478235171070744e+06, - "cpu_time": 2.0730131392669857e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8666639663514551e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time_median", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8488121770314095e+06, - "cpu_time": 2.0743977905759248e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8619061490104254e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8041296905173449e+03, - "cpu_time": 2.7652171333929355e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3460199032268478e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5175311194802032e-03, - "cpu_time": 1.3339120148416967e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5180680223530810e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 382, - "real_time": 1.8540645506470990e+06, - "cpu_time": 2.0820072774868642e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7673602566082951e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 382, - "real_time": 1.8497181540743341e+06, - "cpu_time": 2.0777905183243698e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7715131317613248e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 382, - "real_time": 1.8555744993508030e+06, - "cpu_time": 2.0837191806283463e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7659220910539735e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 382, - "real_time": 1.8545215193173699e+06, - "cpu_time": 2.0826159869108959e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7669247651578378e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 382, - "real_time": 1.8475547933112036e+06, - "cpu_time": 2.0758048795811068e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7735874529205658e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8522867033401621e+06, - "cpu_time": 2.0803875685863167e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7690615395003993e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time_median", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8540645506470990e+06, - "cpu_time": 2.0820072774868645e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7673602566082951e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4624111525048056e+03, - "cpu_time": 3.4071488274665708e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3094750912625859e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8692630823625544e-03, - "cpu_time": 1.6377471577480279e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8707518180499333e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 381, - "real_time": 1.8544072087869728e+06, - "cpu_time": 2.0888491469815988e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5340673660813250e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 381, - "real_time": 1.8489516128486774e+06, - "cpu_time": 2.0830623569554400e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5444951368429147e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 381, - "real_time": 1.8553713919732992e+06, - "cpu_time": 2.0891097664042504e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5322308128454275e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 381, - "real_time": 1.8552420660662416e+06, - "cpu_time": 2.0889224881888526e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5324770389105670e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 381, - "real_time": 1.8491439579634957e+06, - "cpu_time": 2.0825536850391536e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5441264439019822e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8526232475277376e+06, - "cpu_time": 2.0864994887138593e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5374793597164437e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time_median", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8544072087869730e+06, - "cpu_time": 2.0888491469815988e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5340673660813250e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2855510683642292e+03, - "cpu_time": 3.3759669506645978e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2772807632963173e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7734588361388024e-03, - "cpu_time": 1.6180051655539009e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7745066825773620e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 381, - "real_time": 1.8557355028156708e+06, - "cpu_time": 2.1045180236220532e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0630755191743135e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 381, - "real_time": 1.8473755571092269e+06, - "cpu_time": 2.0994207952756626e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0950381201915130e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 381, - "real_time": 1.8553680491959432e+06, - "cpu_time": 2.1030241469816840e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0644743535818890e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 381, - "real_time": 1.8527979490144323e+06, - "cpu_time": 2.1009471207346204e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0742738067970008e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 381, - "real_time": 1.8560622166108896e+06, - "cpu_time": 2.1046385931758108e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0618322396182001e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8534678549492327e+06, - "cpu_time": 2.1025097359579662e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0717388078725830e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time_median", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8553680491959429e+06, - "cpu_time": 2.1030241469816845e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0644743535818890e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6417215840937642e+03, - "cpu_time": 2.2810738681240819e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3921648033727903e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9648150758964805e-03, - "cpu_time": 1.0849290393819537e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9686315363103752e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 380, - "real_time": 1.8602413098530010e+06, - "cpu_time": 2.1288735131580131e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4091935202789095e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 380, - "real_time": 1.8593630033903634e+06, - "cpu_time": 2.1282410894735605e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4098591803860059e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 380, - "real_time": 1.8587246855435967e+06, - "cpu_time": 2.1277815447367751e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4103433501413590e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 380, - "real_time": 1.8597120602958295e+06, - "cpu_time": 2.1280394763158783e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4095945581935948e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 380, - "real_time": 1.8604004747574339e+06, - "cpu_time": 2.1283861789473388e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4090729579833037e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8596883067680448e+06, - "cpu_time": 2.1282643605263131e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4096127133966348e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time_median", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8597120602958295e+06, - "cpu_time": 2.1282410894735605e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4095945581935948e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7969626219369388e+02, - "cpu_time": 4.0930801171348645e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1525828862814036e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.6548934556400952e-04, - "cpu_time": 1.9232009862358730e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6553181149066280e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 374, - "real_time": 1.8833050484716753e+06, - "cpu_time": 2.1915884786098260e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7838718981052274e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 374, - "real_time": 1.8832257955508146e+06, - "cpu_time": 2.1903976310162288e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7839890534562999e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 374, - "real_time": 1.8852428929384716e+06, - "cpu_time": 2.1916770401068232e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7810103513123870e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 374, - "real_time": 1.8852459087645395e+06, - "cpu_time": 2.1922621470586797e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7810059025328016e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 374, - "real_time": 1.8811021198582072e+06, - "cpu_time": 2.1900729866310428e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7871320459705794e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8836243531167419e+06, - "cpu_time": 2.1911996566845202e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7834018502754593e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time_median", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8833050484716755e+06, - "cpu_time": 2.1915884786098260e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7838718981052274e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7227578231559733e+03, - "cpu_time": 9.2474236916440714e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5465636324270398e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.1459734012538604e-04, - "cpu_time": 4.2202560882271422e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1491051936141358e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 375, - "real_time": 1.8754846017497282e+06, - "cpu_time": 2.2692994586665616e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5909603257831812e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 375, - "real_time": 1.8794845884355404e+06, - "cpu_time": 2.2717815813333192e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5790614429715621e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 375, - "real_time": 1.8755114488303661e+06, - "cpu_time": 2.2694798506666608e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5908802937669528e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 375, - "real_time": 1.8811353886655222e+06, - "cpu_time": 2.2726140266665122e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5741655083309031e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 375, - "real_time": 1.8747771332661312e+06, - "cpu_time": 2.2687112080002408e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5930701382794762e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8772786321894575e+06, - "cpu_time": 2.2703772250666590e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5856275418264151e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time_median", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8755114488303661e+06, - "cpu_time": 2.2694798506666608e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5908802937669528e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8434043231740284e+03, - "cpu_time": 1.7115761749764254e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4544972600385884e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5146416064288680e-03, - "cpu_time": 7.5387303751964512e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5136163657045590e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 366, - "real_time": 1.9194959396308113e+06, - "cpu_time": 2.4719223579237084e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0925534963118277e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 366, - "real_time": 1.9186605478934639e+06, - "cpu_time": 2.4710519016391411e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0930291980530405e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 366, - "real_time": 1.9182185790325957e+06, - "cpu_time": 2.4710797950818683e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0932810384193258e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 366, - "real_time": 1.9205276589698154e+06, - "cpu_time": 2.4721486038251002e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0919665698149471e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 366, - "real_time": 1.9209447027059384e+06, - "cpu_time": 2.4721109918034114e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0917295000974505e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9195694856465249e+06, - "cpu_time": 2.4716627300546458e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0925119605393183e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time_median", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9194959396308116e+06, - "cpu_time": 2.4719223579237084e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0925534963118277e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1689571862897401e+03, - "cpu_time": 5.5166635805831515e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6528866588872531e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.0896841454844591e-04, - "cpu_time": 2.2319645449608673e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0895321050792497e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 349, - "real_time": 2.0156135394993136e+06, - "cpu_time": 2.8869493667621245e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0809068394340525e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 349, - "real_time": 2.0166579103577656e+06, - "cpu_time": 2.8872358595988271e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0798291958480496e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 349, - "real_time": 2.0133281596282492e+06, - "cpu_time": 2.8866652234955314e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0832689295789998e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 349, - "real_time": 2.0128527267924096e+06, - "cpu_time": 2.8863194441261129e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0837609946177492e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 349, - "real_time": 2.0112229389722932e+06, - "cpu_time": 2.8866731432665940e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0854495634100270e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0139350550500061e+06, - "cpu_time": 2.8867686074498380e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0826431045777757e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time_median", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0133281596282492e+06, - "cpu_time": 2.8866731432665940e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0832689295789998e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1866973499463475e+03, - "cpu_time": 3.4371057552330313e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2610973682705485e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0857834489067233e-03, - "cpu_time": 1.1906412402999486e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0856864353285109e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 344, - "real_time": 2.0395864757606324e+06, - "cpu_time": 3.6472685174418911e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1128964619514828e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 344, - "real_time": 2.0378803973746768e+06, - "cpu_time": 3.6474702325582323e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1163397080646744e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 344, - "real_time": 2.0379083042255016e+06, - "cpu_time": 3.6487464912792230e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1162833394449778e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 344, - "real_time": 2.0431502066352298e+06, - "cpu_time": 3.6472416656974559e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1057226104853120e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 344, - "real_time": 2.0340222768555935e+06, - "cpu_time": 3.6453632267440897e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1241475550444784e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0385095321703267e+06, - "cpu_time": 3.6472180267441785e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1150779349981852e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time_median", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0379083042255018e+06, - "cpu_time": 3.6472685174418911e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1162833394449778e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3010760699338070e+03, - "cpu_time": 1.2086358796415122e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6630323488573879e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6193576815994924e-03, - "cpu_time": 3.3138569473469204e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6191752511390350e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 189, - "real_time": 3.7016252427800465e+06, - "cpu_time": 6.8701339259258593e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5323918278122988e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 189, - "real_time": 3.6957475218783924e+06, - "cpu_time": 6.8673138624338508e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5396001487333336e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 189, - "real_time": 3.6927617214147062e+06, - "cpu_time": 6.8684546296295868e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5432706645292587e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 189, - "real_time": 3.6953251424526409e+06, - "cpu_time": 6.8653850582014602e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5401190296518040e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 189, - "real_time": 3.6972967646621838e+06, - "cpu_time": 6.8714596878303308e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5376979636453142e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6965512786375941e+06, - "cpu_time": 6.8685494328042176e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5386159268744011e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time_median", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6957475218783924e+06, - "cpu_time": 6.8684546296295868e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5396001487333336e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2715073107378880e+03, - "cpu_time": 2.3732409866135504e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0148679596519736e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.8501607691578925e-04, - "cpu_time": 3.4552288075251271e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8460183111746234e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 96, - "real_time": 7.4185488580648480e+06, - "cpu_time": 1.3931253145833248e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5230452264963284e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 96, - "real_time": 7.4056787755883606e+06, - "cpu_time": 1.3932688218749451e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5309056761423187e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 96, - "real_time": 7.4191405486393096e+06, - "cpu_time": 1.3935714635415763e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5226845050339384e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 96, - "real_time": 7.4099039047723636e+06, - "cpu_time": 1.3917241645832708e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5283221525166073e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 96, - "real_time": 7.4032521515619010e+06, - "cpu_time": 1.3938129572916105e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5323908078587942e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4113048477253569e+06, - "cpu_time": 1.3931005443749458e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5274696736095982e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time_median", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4099039047723636e+06, - "cpu_time": 1.3932688218749454e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5283221525166073e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2858619768451390e+03, - "cpu_time": 8.1434778120442088e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4503923005505931e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.8307411805915405e-04, - "cpu_time": 5.8455779411801254e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.8297561803488485e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49, - "real_time": 1.4519269559152272e+07, - "cpu_time": 2.6786606081632920e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6220551059125214e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49, - "real_time": 1.4518306438564038e+07, - "cpu_time": 2.6759709877549596e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6223617254518795e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49, - "real_time": 1.4544023980139470e+07, - "cpu_time": 2.6857333102041095e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6141882117108870e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49, - "real_time": 1.4530165957248941e+07, - "cpu_time": 2.6825935591836132e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6185889546925735e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49, - "real_time": 1.4534032029308835e+07, - "cpu_time": 2.6839294326529332e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6173604038212204e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4529159592882713e+07, - "cpu_time": 2.6813775795917820e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6189108803178167e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time_median", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4530165957248941e+07, - "cpu_time": 2.6825935591836132e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6185889546925735e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0739030917139153e+04, - "cpu_time": 3.9867317005041819e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4134183368582292e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.3913641380880693e-04, - "cpu_time": 1.4868221957428053e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3900935205386772e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 28, - "real_time": 2.8186086831348281e+07, - "cpu_time": 5.1086727785713851e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7618432740625916e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 28, - "real_time": 2.8158069654767003e+07, - "cpu_time": 5.1155324035712674e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7665812907483063e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 28, - "real_time": 2.8154583448278051e+07, - "cpu_time": 5.1071942892856933e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7671715067838736e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 28, - "real_time": 2.8174132441303559e+07, - "cpu_time": 5.1085365571428351e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7638637420201616e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 28, - "real_time": 2.8176292111831050e+07, - "cpu_time": 5.1078754999999933e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7634985990098677e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8169832897505593e+07, - "cpu_time": 5.1095623057142347e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7645916825249605e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time_median", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8174132441303562e+07, - "cpu_time": 5.1085365571428351e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7638637420201616e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3184436597029184e+04, - "cpu_time": 3.3888900246529498e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2300511256560911e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6803389445013898e-04, - "cpu_time": 6.6324468161646922e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6804663951272566e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.1808930933475494e+07, - "cpu_time": 9.2547179700000018e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.1812583499296799e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.4739557206630707e+07, - "cpu_time": 9.5645050899997845e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9038660467550125e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.4677268862724304e+07, - "cpu_time": 9.5614573700004250e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9094525308853397e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.4764563962817192e+07, - "cpu_time": 9.5643009100001559e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9016268290249920e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.1790754869580269e+07, - "cpu_time": 9.2592047899995580e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.1830767223991127e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3556215167045593e+07, - "cpu_time": 9.4408372259999841e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0158560957988272e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time_median", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4677268862724304e+07, - "cpu_time": 9.5614573700004250e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9094525308853397e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6036691396836899e+06, - "cpu_time": 1.6786673304535244e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5184898643964300e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9943660781138720e-02, - "cpu_time": 1.7780915932227800e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0273792457249409e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 9.6866594627499580e+07, - "cpu_time": 1.7536841100000799e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.5423741700070772e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 1.0708353482186794e+08, - "cpu_time": 1.8428507462500933e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0135710676069641e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 9.6901213750243187e+07, - "cpu_time": 1.7543114887500623e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.5403940902510386e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 1.0690589249134064e+08, - "cpu_time": 1.8363667037499455e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0219019690003195e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 9.6725872717797756e+07, - "cpu_time": 1.7538594900000247e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.5504375087557592e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0089662168174982e+08, - "cpu_time": 1.7882145077500409e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.3337357611242323e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time_median", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6901213750243187e+07, - "cpu_time": 1.7543114887500623e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.5403940902510386e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5675124468610566e+06, - "cpu_time": 4.6972818862983203e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8850608441182077e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.5180365348824242e-02, - "cpu_time": 2.6268000096971098e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4090809393791593e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.8047043308615685e+08, - "cpu_time": 3.2223051799999779e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9496827576592236e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8141903728246689e+08, - "cpu_time": 3.2160944000000316e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9185730454968681e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.8042083457112312e+08, - "cpu_time": 3.2186691075000340e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9513183527411499e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8105695024132729e+08, - "cpu_time": 3.2107916974999285e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9304093135824413e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8062078952789307e+08, - "cpu_time": 3.2182101200001514e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9447299882064972e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8079760894179344e+08, - "cpu_time": 3.2172141010000247e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9389426915372362e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time_median", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8062078952789307e+08, - "cpu_time": 3.2182101200001514e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9447299882064972e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2828120560725091e+05, - "cpu_time": 4.2287462737212126e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4051155045248060e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3688433055833891e-03, - "cpu_time": 1.3144124515700611e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3659354492964568e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 383, - "real_time": 1.8406364214624821e+06, - "cpu_time": 2.0688655404700448e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2253172610512148e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 383, - "real_time": 1.8362169785533883e+06, - "cpu_time": 2.0692797650131891e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2306731981243948e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 383, - "real_time": 1.8444580504170426e+06, - "cpu_time": 2.0775811644909491e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2207065100091980e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 383, - "real_time": 1.8412216808566370e+06, - "cpu_time": 2.0688157624020020e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2246099112271573e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 383, - "real_time": 1.8453917285971837e+06, - "cpu_time": 2.0747129895559023e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2195829408608368e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8415849719773468e+06, - "cpu_time": 2.0718510443864174e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2241779642545604e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time_median", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8412216808566370e+06, - "cpu_time": 2.0692797650131888e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2246099112271573e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6260535571700225e+03, - "cpu_time": 4.0547088223529236e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3828607372568322e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9689852015227164e-03, - "cpu_time": 1.9570464939257901e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9705530796973614e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 383, - "real_time": 1.8401956705654019e+06, - "cpu_time": 2.0697489712793150e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4517005071982378e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 383, - "real_time": 1.8381975551972326e+06, - "cpu_time": 2.0730014229765197e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4565394926341446e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 383, - "real_time": 1.8423320934150305e+06, - "cpu_time": 2.0720747754566818e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4465381834688317e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 383, - "real_time": 1.8475979159500415e+06, - "cpu_time": 2.0765598250652952e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4338651441851426e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 383, - "real_time": 1.8454807002797078e+06, - "cpu_time": 2.0748929608355938e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4389518669896638e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8427607870814831e+06, - "cpu_time": 2.0732555911226813e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4455190388952047e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time_median", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8423320934150300e+06, - "cpu_time": 2.0730014229765194e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4465381834688317e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8204197979231722e+03, - "cpu_time": 2.6150645945912024e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2146705770078097e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0732044141083855e-03, - "cpu_time": 1.2613324694690094e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0727997105367993e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 383, - "real_time": 1.8429269871459277e+06, - "cpu_time": 2.0733562375978820e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8902056968481913e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 383, - "real_time": 1.8390393196813357e+06, - "cpu_time": 2.0750092375980995e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9089992936306447e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 383, - "real_time": 1.8437044144592579e+06, - "cpu_time": 2.0743382663184393e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8864570001071896e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 383, - "real_time": 1.8494143219326995e+06, - "cpu_time": 2.0803324125326935e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8590208292959332e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 383, - "real_time": 1.8467786932185076e+06, - "cpu_time": 2.0771026919060289e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8716639736873303e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8443727472875458e+06, - "cpu_time": 2.0760277691906285e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8832693587138578e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time_median", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8437044144592576e+06, - "cpu_time": 2.0750092375980995e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8864570001071896e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9429808492143770e+03, - "cpu_time": 2.7710251151792004e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8993285233084680e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1378438035441483e-03, - "cpu_time": 1.3347726635947296e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1380962870897989e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 382, - "real_time": 1.8453161843658637e+06, - "cpu_time": 2.0793927670157431e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7757390455696139e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 382, - "real_time": 1.8428797614276141e+06, - "cpu_time": 2.0820795078531571e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7780867035305541e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 382, - "real_time": 1.8457279288454081e+06, - "cpu_time": 2.0797859345550085e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7753429141909320e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 382, - "real_time": 1.8498733229177860e+06, - "cpu_time": 2.0844501361256910e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7713645358329386e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 382, - "real_time": 1.8501317191051370e+06, - "cpu_time": 2.0848482905758894e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7711171405595418e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8467857833323616e+06, - "cpu_time": 2.0821113272250979e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7743300679367162e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time_median", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8457279288454081e+06, - "cpu_time": 2.0820795078531574e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7753429141909320e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1330484853493640e+03, - "cpu_time": 2.5377169173772318e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0100111909312312e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6964872231667574e-03, - "cpu_time": 1.2188190344074132e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6964212269881835e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 382, - "real_time": 1.8479419507109744e+06, - "cpu_time": 2.0861821020941238e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5464317466674633e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 382, - "real_time": 1.8430221458421277e+06, - "cpu_time": 2.0869284502616343e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5558986715297878e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 382, - "real_time": 1.8475205921010282e+06, - "cpu_time": 2.0862084083769119e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5472405709682234e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 382, - "real_time": 1.8540437688931569e+06, - "cpu_time": 2.0928460471206456e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5347601334743164e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 382, - "real_time": 1.8548952958501475e+06, - "cpu_time": 2.0934520785339568e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5331374308091670e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8494847506794869e+06, - "cpu_time": 2.0891234172774546e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5434937106897913e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time_median", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8479419507109742e+06, - "cpu_time": 2.0869284502616343e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5464317466674633e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9513144229657819e+03, - "cpu_time": 3.6932970811797591e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4879130311939516e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6771317909740568e-03, - "cpu_time": 1.7678692654706167e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6775588743311175e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 385, - "real_time": 1.8488040054065790e+06, - "cpu_time": 2.0996968337660246e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0895562545676842e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 385, - "real_time": 1.8453022828340747e+06, - "cpu_time": 2.0996292259738976e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1030096921950042e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 385, - "real_time": 1.8517093519398989e+06, - "cpu_time": 2.1032680805192641e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0784326850585669e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 385, - "real_time": 1.8444216407626842e+06, - "cpu_time": 2.1001675350648779e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1064011125894502e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 385, - "real_time": 1.8476170762865383e+06, - "cpu_time": 2.1000619870129451e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0941106619038776e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8475708714459552e+06, - "cpu_time": 2.1005647324674022e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0943020812629163e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time_median", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8476170762865383e+06, - "cpu_time": 2.1000619870129446e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0941106619038776e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9031845976935506e+03, - "cpu_time": 1.5286456432740290e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1142332514446873e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5713522239184500e-03, - "cpu_time": 7.2773079526971987e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5706030539459821e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8553337717533174e+06, - "cpu_time": 2.1270033899204209e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4129209740642521e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8645930117853379e+06, - "cpu_time": 2.1364522599469637e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4059046577086464e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8488077113861267e+06, - "cpu_time": 2.1204710795756006e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4179084086763135e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8465481714338721e+06, - "cpu_time": 2.1215887984085828e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4196434409639111e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8480480021725479e+06, - "cpu_time": 2.1217454084880929e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4184912929308435e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8526661337062407e+06, - "cpu_time": 2.1254521872679321e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4149737548687932e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time_median", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8488077113861269e+06, - "cpu_time": 2.1217454084880934e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4179084086763135e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4667720182566818e+03, - "cpu_time": 6.6499106170754985e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6844891491672315e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.0302847244902537e-03, - "cpu_time": 3.1287039327021178e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0173813327684929e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 373, - "real_time": 1.8731012435420230e+06, - "cpu_time": 2.1837169410187760e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7990371679460031e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 373, - "real_time": 1.8736056879851918e+06, - "cpu_time": 2.1853096058980883e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7982835628760314e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 373, - "real_time": 1.8755518653412568e+06, - "cpu_time": 2.1860651796245212e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7953799075804591e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 373, - "real_time": 1.8783310904534629e+06, - "cpu_time": 2.1869950214475822e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7912437943697536e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 373, - "real_time": 1.8802351898347696e+06, - "cpu_time": 2.1885104369972399e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7884171237432969e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8761650154313408e+06, - "cpu_time": 2.1861194369972418e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7944723113031083e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time_median", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8755518653412566e+06, - "cpu_time": 2.1860651796245212e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7953799075804591e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0647597327134799e+03, - "cpu_time": 1.7968226347505865e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5627815998577006e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6335235480386962e-03, - "cpu_time": 8.2192336079250255e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6327882661073857e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 374, - "real_time": 1.8793994916153492e+06, - "cpu_time": 2.2691480534757329e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5793140557824981e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 374, - "real_time": 1.8708480339631799e+06, - "cpu_time": 2.2647848128344705e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6048165375501430e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 374, - "real_time": 1.8780673089882927e+06, - "cpu_time": 2.2685835748662236e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5832716696658957e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 374, - "real_time": 1.8697994803813072e+06, - "cpu_time": 2.2644040695187119e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6079596288376570e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 374, - "real_time": 1.8828296914844858e+06, - "cpu_time": 2.2734929732621065e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5691494814555836e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8761888012865230e+06, - "cpu_time": 2.2680826967914486e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5889022746583557e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time_median", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8780673089882925e+06, - "cpu_time": 2.2685835748662236e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5832716696658957e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.6410540553520714e+03, - "cpu_time": 3.7102995972037170e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6809647563229874e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0066558607981988e-03, - "cpu_time": 1.6358749186934430e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0076832152620583e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 366, - "real_time": 1.9192412427863199e+06, - "cpu_time": 2.4654336803278779e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0926984858638160e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 366, - "real_time": 1.9207734559265680e+06, - "cpu_time": 2.4670354808746031e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0918268333671594e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 366, - "real_time": 1.9200408024601436e+06, - "cpu_time": 2.4666158989071236e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0922434550937274e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 366, - "real_time": 1.9182296666377757e+06, - "cpu_time": 2.4651541639342648e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0932747191194444e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 366, - "real_time": 1.9191507381435402e+06, - "cpu_time": 2.4658475191258132e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0927500160975611e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9194871811908695e+06, - "cpu_time": 2.4660173486339366e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0925587019083416e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time_median", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9192412427863199e+06, - "cpu_time": 2.4658475191258132e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0926984858638160e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6384927234144959e+02, - "cpu_time": 7.9206285490094137e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4859671803611808e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.0213894720748677e-04, - "cpu_time": 3.2119111219542268e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0212104583296038e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 349, - "real_time": 2.0131426349677211e+06, - "cpu_time": 2.8756120716333338e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0834609168501625e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 349, - "real_time": 2.0170326032448977e+06, - "cpu_time": 2.8764783123209192e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0794428375884559e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 349, - "real_time": 2.0221292500232044e+06, - "cpu_time": 2.8811733094556187e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0742017355972023e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 349, - "real_time": 2.0141383268761004e+06, - "cpu_time": 2.8757871575931795e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0824309552290311e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 349, - "real_time": 2.0142204166899694e+06, - "cpu_time": 2.8752231489969948e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0823460854858325e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0161326463603787e+06, - "cpu_time": 2.8768548000000096e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0803765061501369e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time_median", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0142204166899696e+06, - "cpu_time": 2.8757871575931795e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0823460854858325e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6518241513641574e+03, - "cpu_time": 2.4565110412358367e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7620845786558283e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8113015321470089e-03, - "cpu_time": 8.5388773921986902e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8083671717759370e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 340, - "real_time": 2.0696518658523392e+06, - "cpu_time": 3.6221154852940426e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0531492945289817e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 340, - "real_time": 2.0667831314152437e+06, - "cpu_time": 3.6229382676471206e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0587751431161742e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 340, - "real_time": 2.0702282750896888e+06, - "cpu_time": 3.6297166029411904e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0520207848270154e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 340, - "real_time": 2.0696165221606325e+06, - "cpu_time": 3.6221706470588711e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0532185118248301e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 340, - "real_time": 2.0687623832867865e+06, - "cpu_time": 3.6217085147059686e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0548919816844487e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0690084355609384e+06, - "cpu_time": 3.6237299035294391e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0544111431962900e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time_median", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0696165221606325e+06, - "cpu_time": 3.6221706470588716e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0532185118248301e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3494721738580133e+03, - "cpu_time": 3.3760515749092347e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6459471714151814e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.5223135423909072e-04, - "cpu_time": 9.3165099629004624e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5260948580790753e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 192, - "real_time": 3.6390056593518239e+06, - "cpu_time": 6.6662588125000848e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6103846958535213e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 192, - "real_time": 3.6411565330733233e+06, - "cpu_time": 6.6654903958334923e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6076612877280416e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 192, - "real_time": 3.6372006118957265e+06, - "cpu_time": 6.6655398593749031e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6126727090963602e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 192, - "real_time": 3.6376597236085217e+06, - "cpu_time": 6.6587637604171112e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6120905402765846e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 192, - "real_time": 3.6384155597867598e+06, - "cpu_time": 6.6607393958335593e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6111324350710716e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6386876175432308e+06, - "cpu_time": 6.6633584447918311e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6107883336051159e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time_median", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6384155597867602e+06, - "cpu_time": 6.6654903958334932e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6111324350710716e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5442200015810733e+03, - "cpu_time": 3.3795879776507418e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9561670682025091e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2438927544533202e-04, - "cpu_time": 5.0718988114653693e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2425870082676452e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 97, - "real_time": 7.3375041481376309e+06, - "cpu_time": 1.3683975597937489e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5730034794619665e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 97, - "real_time": 7.3268253442629715e+06, - "cpu_time": 1.3688205484536693e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5796686045305681e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 97, - "real_time": 7.3317209757941281e+06, - "cpu_time": 1.3665614762885526e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5766106089935570e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 97, - "real_time": 7.3285191751939738e+06, - "cpu_time": 1.3712114690721728e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5786101117913599e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 97, - "real_time": 7.3281776870495267e+06, - "cpu_time": 1.3684944742268862e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5788234719387236e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3305494660876468e+06, - "cpu_time": 1.3686971055670058e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5773432553432350e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time_median", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3285191751939729e+06, - "cpu_time": 1.3684944742268864e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5786101117913599e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2824215596425374e+03, - "cpu_time": 1.6604940175348103e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6727158772753980e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.8418834487833956e-04, - "cpu_time": 1.2131931972245407e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8390112521176495e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49, - "real_time": 1.4500217474236781e+07, - "cpu_time": 2.6617099428570013e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6281281035429630e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49, - "real_time": 1.2378869217117222e+07, - "cpu_time": 2.5805156020408280e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 5.4212434773285570e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49, - "real_time": 1.4483005910807727e+07, - "cpu_time": 2.6558464081633747e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6336281579448242e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49, - "real_time": 1.4529886047298811e+07, - "cpu_time": 2.6596021918368597e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6186779291690264e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49, - "real_time": 1.4496674533097111e+07, - "cpu_time": 2.6568231816327170e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6292592033286591e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4077730636511531e+07, - "cpu_time": 2.6428994653061565e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7861873742628059e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time_median", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4496674533097113e+07, - "cpu_time": 2.6568231816327170e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6292592033286591e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.4984627733960398e+05, - "cpu_time": 3.4950160016930418e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5504899894713932e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.7471547926632028e-02, - "cpu_time": 1.3224173100690288e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4182009851176345e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 25, - "real_time": 2.7992481440305710e+07, - "cpu_time": 4.9991184800001070e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7947777793912573e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 25, - "real_time": 2.8055348768830299e+07, - "cpu_time": 5.0125176679998733e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7840334870160980e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 25, - "real_time": 2.8017396703362465e+07, - "cpu_time": 5.0066055360002793e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7905138875337429e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 25, - "real_time": 2.8030715137720108e+07, - "cpu_time": 4.9980486320000641e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7882377363746653e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 25, - "real_time": 2.6444602087140083e+07, - "cpu_time": 4.8867392880001716e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0754300464694691e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7708108827471741e+07, - "cpu_time": 4.9806059208000995e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8465985873570471e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time_median", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8017396703362472e+07, - "cpu_time": 4.9991184800001070e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7905138875337429e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0668707081931294e+05, - "cpu_time": 5.2802100751887984e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2797959513147898e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5504702439982273e-02, - "cpu_time": 1.0601541577777688e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6406064547068044e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.4515822976827621e+07, - "cpu_time": 9.4048266499999046e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9239916292578135e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.4455584287643433e+07, - "cpu_time": 9.4086675600010484e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9294385417311726e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 4.9163064733147621e+07, - "cpu_time": 9.0780930300002187e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.4601041952335920e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.4360303655266762e+07, - "cpu_time": 9.3987927200009838e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9380786704636507e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.4580578207969666e+07, - "cpu_time": 9.4206901100005776e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9181497304256115e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3415070772171028e+07, - "cpu_time": 9.3422140140005469e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0339525534223680e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time_median", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4455584287643433e+07, - "cpu_time": 9.4048266499999046e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9294385417311726e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3783267192510259e+06, - "cpu_time": 1.4786476741288612e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3833899206220707e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.4525387402278266e-02, - "cpu_time": 1.5827593672259183e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7346292904602495e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.0663972888141870e+08, - "cpu_time": 1.8139289362500221e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0344362052625809e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 9.3293572776019573e+07, - "cpu_time": 1.7877007449999383e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.7546398537970743e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.0673420876264572e+08, - "cpu_time": 1.8156231925000554e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0299797808394051e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 9.3309409916400909e+07, - "cpu_time": 1.7753615525001010e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.7536631351650496e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.0662806872278452e+08, - "cpu_time": 1.8164014887500456e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0349867387711601e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0132099781185389e+08, - "cpu_time": 1.8018031830000323e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.3215411427670546e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time_median", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0662806872278452e+08, - "cpu_time": 1.8139289362500221e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0349867387711601e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3208921579662086e+06, - "cpu_time": 1.9034019979196347e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9492233703851557e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.2254441982111159e-02, - "cpu_time": 1.0563872990558484e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4212023630652019e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.8973470851778984e+08, - "cpu_time": 3.0833785849998206e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6591744988994684e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8971751257777214e+08, - "cpu_time": 3.0700468399999183e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6596874448258114e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.9149832427501678e+08, - "cpu_time": 3.0900815349997401e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6070559785054073e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8973119184374809e+08, - "cpu_time": 3.0711257175002515e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6592793918897276e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8985195085406303e+08, - "cpu_time": 3.0659702900001663e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6556796976259289e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9010673761367801e+08, - "cpu_time": 3.0761205934999800e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6481754023492699e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time_median", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8973470851778984e+08, - "cpu_time": 3.0711257175002515e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6591744988994684e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7980223950397607e+05, - "cpu_time": 1.0154484934464868e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3043042851512469e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1019179503707925e-03, - "cpu_time": 3.3010685458567130e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0797321630500491e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 385, - "real_time": 1.8328108072247624e+06, - "cpu_time": 2.0716483844155362e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2348187733583660e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 385, - "real_time": 1.8308890198792827e+06, - "cpu_time": 2.0685386753248405e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2371645443971609e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 385, - "real_time": 1.8272812022410284e+06, - "cpu_time": 2.0693189480520138e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2415816432503941e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 385, - "real_time": 1.8306222357242913e+06, - "cpu_time": 2.0687409272727857e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2374905756453928e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 385, - "real_time": 1.8344249327435738e+06, - "cpu_time": 2.0729901480521008e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2328523380207247e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8312056395625877e+06, - "cpu_time": 2.0702474166234557e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2367815749344076e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time_median", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8308890198792827e+06, - "cpu_time": 2.0693189480520138e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2371645443971609e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6824535486578861e+03, - "cpu_time": 1.9708277019654311e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2780137358977577e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4648565353362676e-03, - "cpu_time": 9.5197689229813078e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4655046217438032e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 385, - "real_time": 1.8341784659348272e+06, - "cpu_time": 2.0745803506492670e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4663047528609913e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 385, - "real_time": 1.8296249162076139e+06, - "cpu_time": 2.0693757558443726e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4774204414422316e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 385, - "real_time": 1.8254973282531060e+06, - "cpu_time": 2.0701001792209449e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4875442287495779e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 385, - "real_time": 1.8303534628894459e+06, - "cpu_time": 2.0700816233766561e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4756382666481724e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 385, - "real_time": 1.8351534470143218e+06, - "cpu_time": 2.0740282233764329e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4639318926315745e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8309615240598631e+06, - "cpu_time": 2.0716332264935351e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4741679164665099e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time_median", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8303534628894459e+06, - "cpu_time": 2.0701001792209451e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4756382666481724e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8708728936354623e+03, - "cpu_time": 2.4635051634478723e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4640385736242042e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1141202820321547e-03, - "cpu_time": 1.1891608668671643e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1152622678271009e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 384, - "real_time": 1.8381891872725950e+06, - "cpu_time": 2.0781362369793516e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9131195599674303e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 384, - "real_time": 1.8323820729809387e+06, - "cpu_time": 2.0721786510418856e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9413666732431687e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 384, - "real_time": 1.8283316008478322e+06, - "cpu_time": 2.0727902916665524e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9611753099943288e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 384, - "real_time": 1.8334549618354384e+06, - "cpu_time": 2.0725880651042417e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9361344243756477e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 384, - "real_time": 1.8388720587078447e+06, - "cpu_time": 2.0783460572918837e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9098096425005533e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8342459763289304e+06, - "cpu_time": 2.0748078604167835e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9323211220162269e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time_median", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8334549618354384e+06, - "cpu_time": 2.0727902916665524e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9361344243756477e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3597370239159118e+03, - "cpu_time": 3.1427593167982841e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1239080316607698e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3768551656531437e-03, - "cpu_time": 1.5147230626777039e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3777784101668702e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 384, - "real_time": 1.8399133163976937e+06, - "cpu_time": 2.0832328046873629e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7809534670989502e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 384, - "real_time": 1.8353508168994875e+06, - "cpu_time": 2.0780472161456842e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7853807401985392e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 384, - "real_time": 1.8315382698119720e+06, - "cpu_time": 2.0792235624999360e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7890972053433534e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 384, - "real_time": 1.8357099532977373e+06, - "cpu_time": 2.0789347135418504e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7850314501555298e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 384, - "real_time": 1.8394078672940850e+06, - "cpu_time": 2.0827606692709702e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7814428535746306e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8363840447401956e+06, - "cpu_time": 2.0804397932291608e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7843811432742007e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time_median", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8357099532977373e+06, - "cpu_time": 2.0792235624999360e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7850314501555298e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4133105251505285e+03, - "cpu_time": 2.3799309737715616e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3183521817829627e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8587127975365472e-03, - "cpu_time": 1.1439557066333290e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8596655732945285e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 384, - "real_time": 1.8431266142708107e+06, - "cpu_time": 2.0910555546874339e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5556971231695749e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 384, - "real_time": 1.8364182597376080e+06, - "cpu_time": 2.0847128229168160e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5686859272115894e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 384, - "real_time": 1.8323303315241903e+06, - "cpu_time": 2.0854434635418549e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5766476640423834e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 384, - "real_time": 1.8370261755270197e+06, - "cpu_time": 2.0849235286458286e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5675049638962574e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 384, - "real_time": 1.8440961879377936e+06, - "cpu_time": 2.0925736119791577e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5538276380955622e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8385995137994848e+06, - "cpu_time": 2.0877417963542182e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5644726632830739e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time_median", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8370261755270199e+06, - "cpu_time": 2.0854434635418549e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5675049638962574e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9306179700101729e+03, - "cpu_time": 3.7658691959323405e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5590761705499026e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6817248307767698e-03, - "cpu_time": 1.8038002604098854e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6817644778191316e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 383, - "real_time": 1.8348281711200736e+06, - "cpu_time": 2.0997648015664727e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1435572040507138e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 383, - "real_time": 1.8435429801280529e+06, - "cpu_time": 2.1046466031329297e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1097881314866722e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 383, - "real_time": 1.8391118442801414e+06, - "cpu_time": 2.0996039268930103e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1269183768050686e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 383, - "real_time": 1.8412210985330632e+06, - "cpu_time": 2.1040429373366167e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1187539673767388e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 383, - "real_time": 1.8350228210716620e+06, - "cpu_time": 2.0996756788511332e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1427994515868366e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8387453830265987e+06, - "cpu_time": 2.1015467895560325e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1283634262612060e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time_median", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8391118442801412e+06, - "cpu_time": 2.0997648015664723e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1269183768050686e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8236898309573144e+03, - "cpu_time": 2.5637301800813179e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4821615588811497e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0795102281445143e-03, - "cpu_time": 1.2199253391940541e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0792452211692812e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 381, - "real_time": 1.8477790429134024e+06, - "cpu_time": 2.1281455118111172e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4186977658685654e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 381, - "real_time": 1.8517013654947584e+06, - "cpu_time": 2.1320566062990366e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4156926429114416e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 381, - "real_time": 1.8488822253255951e+06, - "cpu_time": 2.1287681207349505e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4178512639107418e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 381, - "real_time": 1.8484081214448449e+06, - "cpu_time": 2.1288542440944300e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4182149329396474e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 381, - "real_time": 1.8477890995854214e+06, - "cpu_time": 2.1282925590553400e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4186900445446715e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8489119709528047e+06, - "cpu_time": 2.1292234083989752e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4178293300350139e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time_median", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8484081214448449e+06, - "cpu_time": 2.1287681207349510e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4182149329396474e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6263330753102855e+03, - "cpu_time": 1.6123679042637109e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2459547363367579e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7961628290620178e-04, - "cpu_time": 7.5725633012653059e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7877624615509159e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8698023832884841e+06, - "cpu_time": 2.1872669496020530e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8039754611817163e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8673616203458470e+06, - "cpu_time": 2.1871991591512356e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8076404392572796e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8628629490199550e+06, - "cpu_time": 2.1853347586205378e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8144206758517897e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8653164291785243e+06, - "cpu_time": 2.1845858992044027e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8107188238882005e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8677419249619299e+06, - "cpu_time": 2.1869341803715876e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8070687550191736e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8666170613589485e+06, - "cpu_time": 2.1862641893899636e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8087648310396320e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time_median", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8673616203458472e+06, - "cpu_time": 2.1869341803715876e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8076404392572796e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6339592595213498e+03, - "cpu_time": 1.2256716433846289e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9650240533948847e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4110871019274599e-03, - "cpu_time": 5.6062375687845379e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4116611008431336e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8681200551281655e+06, - "cpu_time": 2.2687736923078303e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6130011404864478e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8639018702313344e+06, - "cpu_time": 2.2672884376656031e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6257038889598739e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8667908262959199e+06, - "cpu_time": 2.2662228832890429e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6169978190892494e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8628412919873691e+06, - "cpu_time": 2.2673196631300780e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6289067915245128e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8682278622780489e+06, - "cpu_time": 2.2675687241379111e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6126772390676403e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8659763811841682e+06, - "cpu_time": 2.2674346801060932e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6194573758255446e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time_median", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8667908262959202e+06, - "cpu_time": 2.2673196631300785e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6169978190892494e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4728630116158683e+03, - "cpu_time": 9.1021820952802477e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4500508717726218e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3252381094162424e-03, - "cpu_time": 4.0143084055035955e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3257598329372768e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 369, - "real_time": 1.9095951701050024e+06, - "cpu_time": 2.4664495149051659e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0982181107447422e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 369, - "real_time": 1.9109276601941220e+06, - "cpu_time": 2.4651477750676051e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0974523231229801e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 369, - "real_time": 1.9118117900794942e+06, - "cpu_time": 2.4674042276423858e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0969447991074474e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 369, - "real_time": 1.9086663908423570e+06, - "cpu_time": 2.4641436937668803e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0987525164491727e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 369, - "real_time": 1.9085740350025294e+06, - "cpu_time": 2.4647235880761361e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0988056850502112e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9099150092447014e+06, - "cpu_time": 2.4655737598916348e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0980346868949108e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time_median", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9095951701050024e+06, - "cpu_time": 2.4651477750676055e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0982181107447422e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4215129604042727e+03, - "cpu_time": 1.3291823936055871e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1706252588158764e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.4428074208727590e-04, - "cpu_time": 5.3909658483062629e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4411358369026270e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 350, - "real_time": 2.0065896409297630e+06, - "cpu_time": 2.8746787628571317e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0902649522582750e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 350, - "real_time": 2.0043427853046786e+06, - "cpu_time": 2.8733051257141340e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0926081260907812e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 350, - "real_time": 2.0026024241399553e+06, - "cpu_time": 2.8732762142856573e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0944267066895721e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 350, - "real_time": 2.0070120392899427e+06, - "cpu_time": 2.8735481828571861e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0898250323819160e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 350, - "real_time": 2.0055999224340275e+06, - "cpu_time": 2.8736421000001295e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0912964510437987e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0052293624196735e+06, - "cpu_time": 2.8736900771428477e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0916842536928689e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time_median", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0055999224340278e+06, - "cpu_time": 2.8735481828571856e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0912964510437987e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7925144964453270e+03, - "cpu_time": 5.7432684741149103e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8705680942430296e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.9391993257186930e-04, - "cpu_time": 1.9985691984659415e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9428798392517475e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 341, - "real_time": 2.0500296864063202e+06, - "cpu_time": 3.6183503900295170e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0919446462773614e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 341, - "real_time": 2.0528740206558551e+06, - "cpu_time": 3.6185388651026520e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0862751029018307e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 341, - "real_time": 2.0580752267941963e+06, - "cpu_time": 3.6252006363635818e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0759481921691899e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 341, - "real_time": 2.0502661918139744e+06, - "cpu_time": 3.6177323079180527e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0914726260877242e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 341, - "real_time": 2.0465908354951227e+06, - "cpu_time": 3.6186279501463631e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0988202695486913e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0515671922330938e+06, - "cpu_time": 3.6196900299120336e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0888921673969598e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time_median", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0502661918139749e+06, - "cpu_time": 3.6185388651026515e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0914726260877242e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2685760802226723e+03, - "cpu_time": 3.1002938457600371e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4991047761231884e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0806416169954463e-03, - "cpu_time": 8.5650810432388912e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0785837405768088e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 195, - "real_time": 3.5908633544563483e+06, - "cpu_time": 6.6031943846155629e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6721956097769823e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 195, - "real_time": 3.6105508653399274e+06, - "cpu_time": 6.6226114820513735e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6467191920921612e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 195, - "real_time": 3.5892773156937882e+06, - "cpu_time": 6.5987640153841702e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6742601711612396e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 195, - "real_time": 3.5935004492505239e+06, - "cpu_time": 6.5983230307694655e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6687669131916008e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 195, - "real_time": 3.5943423588879597e+06, - "cpu_time": 6.6113076564102490e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6676733390501623e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5957068687257096e+06, - "cpu_time": 6.6068401138461642e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6659230450544300e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time_median", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5935004492505239e+06, - "cpu_time": 6.6031943846155629e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6687669131916008e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5421483267262538e+03, - "cpu_time": 1.0243905550493399e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1054318426794119e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3756520313218759e-03, - "cpu_time": 1.5504999930337228e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3691600397291093e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 106, - "real_time": 7.2510257793836435e+06, - "cpu_time": 1.3545328933961207e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6275427809680490e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 106, - "real_time": 7.2560748085379601e+06, - "cpu_time": 1.3479260905659482e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6243227757957668e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 106, - "real_time": 7.2422000702540828e+06, - "cpu_time": 1.3489682811322346e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6331821372649250e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 106, - "real_time": 7.2552945051904554e+06, - "cpu_time": 1.3526208141510289e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6248201194307241e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 106, - "real_time": 7.2609805633788398e+06, - "cpu_time": 1.3521699499999570e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6211984327893190e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2531151453489978e+06, - "cpu_time": 1.3512436058490580e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6262132492497568e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time_median", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2552945051904563e+06, - "cpu_time": 1.3521699499999572e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.6248201194307241e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0512114346917388e+03, - "cpu_time": 2.7275098064631235e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4998927614599885e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.7216317311786668e-04, - "cpu_time": 2.0185181966128778e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7269462495913823e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49, - "real_time": 1.4362072933237163e+07, - "cpu_time": 2.6206644102038417e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6726447019144812e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49, - "real_time": 1.4397576755406905e+07, - "cpu_time": 2.6246826244900782e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6611221554903507e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49, - "real_time": 1.4368730939316506e+07, - "cpu_time": 2.6204028367346283e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6704795491975603e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49, - "real_time": 1.4353403498475648e+07, - "cpu_time": 2.6196851673473377e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6754669724938097e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49, - "real_time": 1.4432871714234352e+07, - "cpu_time": 2.6308722387753103e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6497235843795519e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4382931168134117e+07, - "cpu_time": 2.6232614555102389e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6658873926951504e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time_median", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4368730939316507e+07, - "cpu_time": 2.6206644102038421e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6704795491975603e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2469782522715395e+04, - "cpu_time": 4.6810769551008379e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0517766674209882e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2575219295113730e-03, - "cpu_time": 1.7844492569614424e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2541835644547172e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 25, - "real_time": 2.7870135307312012e+07, - "cpu_time": 4.9957665559995800e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8158262067994566e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 25, - "real_time": 2.7095507606863976e+07, - "cpu_time": 4.8344358919994190e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9535048373110847e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 25, - "real_time": 2.7820502817630768e+07, - "cpu_time": 4.9917401160000734e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8244177641153851e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 25, - "real_time": 2.7901194319128990e+07, - "cpu_time": 4.9941238720002726e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8104653322306223e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 25, - "real_time": 2.7906442582607269e+07, - "cpu_time": 4.9950326520001911e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8095606454565220e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7718756526708603e+07, - "cpu_time": 4.9622198175999083e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8427549571826143e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time_median", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7870135307312012e+07, - "cpu_time": 4.9941238720002733e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8158262067994566e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5007737098481075e+05, - "cpu_time": 7.1449482337677642e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2192098384280294e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2629620331182288e-02, - "cpu_time": 1.4398693521045149e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2842297191196722e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.4403833299875259e+07, - "cpu_time": 9.3927522900003165e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9341276104640865e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.3257106617093086e+07, - "cpu_time": 9.0991950300008282e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0403687517234468e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.4294505715370178e+07, - "cpu_time": 9.3782965700006574e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9440629850693874e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.4274409636855125e+07, - "cpu_time": 9.3694914499997139e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9458936135109701e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.4221912845969200e+07, - "cpu_time": 9.3641491300013512e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9506821487939301e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4090353623032570e+07, - "cpu_time": 9.3207768940005749e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9630270219123640e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time_median", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4274409636855125e+07, - "cpu_time": 9.3694914499997139e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9458936135109701e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7048714192596741e+05, - "cpu_time": 1.2434000968306987e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3653474722462125e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.6981709382951081e-03, - "cpu_time": 1.3340090756072356e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7957358542935099e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.0617277398705482e+08, - "cpu_time": 1.8065783187500983e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0565779892447596e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 1.0485049057751894e+08, - "cpu_time": 1.7588086662502179e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1203471633075113e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.0667163506150246e+08, - "cpu_time": 1.8086895812498939e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0329303726380720e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 1.0466591082513332e+08, - "cpu_time": 1.7543277575001070e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1293769649313717e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.0620841477066278e+08, - "cpu_time": 1.8069827150000605e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0548811330935726e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0571384504437447e+08, - "cpu_time": 1.7870774077500755e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0788227246430578e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time_median", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0617277398705482e+08, - "cpu_time": 1.8065783187500983e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0565779892447596e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9667772482566908e+05, - "cpu_time": 2.7907230995780118e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3168698871199720e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.4821219439069635e-03, - "cpu_time": 1.5616128811630620e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4997451597867372e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 2.0105309784412384e+08, - "cpu_time": 3.1200736925001138e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3405883098228626e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 2.0107398554682732e+08, - "cpu_time": 3.1188340425001115e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3400335258682213e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 2.0187630504369736e+08, - "cpu_time": 3.1252353025001866e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3188105645562611e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 2.0105969905853271e+08, - "cpu_time": 3.1281694099999416e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3404129670332947e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 2.0167966559529305e+08, - "cpu_time": 3.1273674524999249e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3239964516534767e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0134855061769485e+08, - "cpu_time": 3.1239359800000560e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3327683637868233e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time_median", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0107398554682732e+08, - "cpu_time": 3.1252353025001866e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3400335258682213e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9820704580748687e+05, - "cpu_time": 4.2524170485393441e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0537322913332399e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_coarse/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9777000856766626e-03, - "cpu_time": 1.3612369381971994e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9759573629501877e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - } - ] -} diff --git a/results/implicit_managed_GPURdHost_fine.json b/results/implicit_managed_GPURdHost_fine.json deleted file mode 100644 index cc32965..0000000 --- a/results/implicit_managed_GPURdHost_fine.json +++ /dev/null @@ -1,25272 +0,0 @@ -{ - "context": { - "date": "2023-10-09T14:27:09-04:00", - "host_name": "frontier10485", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1728, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [2.12,2.56,2.44], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8628192977173186e+06, - "cpu_time": 2.0664527486772484e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1988176765289041e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8669374079012962e+06, - "cpu_time": 2.0662510767195774e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1939675013553281e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8616810934126892e+06, - "cpu_time": 2.0656471375661376e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2001620011575297e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8662707093065523e+06, - "cpu_time": 2.0651398915343892e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1947512649555248e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8700773003084583e+06, - "cpu_time": 2.0694383518518514e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1902837916509593e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8655571617292627e+06, - "cpu_time": 2.0665858412698410e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1955964471296491e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8662707093065523e+06, - "cpu_time": 2.0662510767195772e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1947512649555248e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3677027538529051e+03, - "cpu_time": 1.6761960537402726e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9627234291984546e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8051994454735658e-03, - "cpu_time": 8.1109432778766739e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8048505381665237e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8654093254693579e+06, - "cpu_time": 2.0657390846560840e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3915294558414416e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8707871068924698e+06, - "cpu_time": 2.0711520185185184e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3789055258177295e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8606127327575691e+06, - "cpu_time": 2.0655969894179872e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4028506608459223e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8650939872179786e+06, - "cpu_time": 2.0656543465608438e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3922719477635520e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8695003439716331e+06, - "cpu_time": 2.0702673703703738e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3819194933105083e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8662806992618020e+06, - "cpu_time": 2.0676819619047616e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3894954167158306e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8654093254693579e+06, - "cpu_time": 2.0657390846560840e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3915294558414416e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0301130208669406e+03, - "cpu_time": 2.7820287602332965e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4835303328055106e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1594356210515556e-03, - "cpu_time": 1.3454819510397402e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1605058059044465e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8673297063938824e+06, - "cpu_time": 2.0700095968169754e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7740263242746610e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8710228408389138e+06, - "cpu_time": 2.0744616366047764e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7567076373337470e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8674654849302839e+06, - "cpu_time": 2.0733772705570280e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7733883877439629e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8719552528772091e+06, - "cpu_time": 2.0777826737400547e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7523459627668280e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8714756744006521e+06, - "cpu_time": 2.0778288859416440e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7545888114453033e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8698497918881886e+06, - "cpu_time": 2.0746920127320960e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7622114247129019e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8710228408389140e+06, - "cpu_time": 2.0744616366047766e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7567076373337470e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2631976452603608e+03, - "cpu_time": 3.2824837374181725e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0609425080883271e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2103633431298066e-03, - "cpu_time": 1.5821547088792107e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2108159192507609e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8702584853570596e+06, - "cpu_time": 2.0780134217506647e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7520572828062378e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8746442687723956e+06, - "cpu_time": 2.0829402015915138e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7479582951200664e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8701570627924339e+06, - "cpu_time": 2.0782183687002666e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7521523005705360e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8741485756515916e+06, - "cpu_time": 2.0822133713527906e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7484206122029275e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8749392845168270e+06, - "cpu_time": 2.0826716047745442e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7476832594312157e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8728295354180620e+06, - "cpu_time": 2.0808113936339561e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7496543500261970e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8741485756515916e+06, - "cpu_time": 2.0822133713527906e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7484206122029275e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4102164787451470e+03, - "cpu_time": 2.4753876109039179e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2526513409896572e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2869385243901160e-03, - "cpu_time": 1.1896261326120809e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2874836340994603e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8705628358463163e+06, - "cpu_time": 2.0840395862068955e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5035444275973193e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8772365877505785e+06, - "cpu_time": 2.0905449469495974e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4910889989912942e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8709626312088778e+06, - "cpu_time": 2.0845369363395195e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5027957751168706e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8779292090452246e+06, - "cpu_time": 2.0921545225464161e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4898014091446906e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8702097269070314e+06, - "cpu_time": 2.0842613262599451e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5042059217809759e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8733801981516059e+06, - "cpu_time": 2.0871074636604753e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.4982873065262303e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8709626312088780e+06, - "cpu_time": 2.0845369363395195e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5027957751168706e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8535467118190159e+03, - "cpu_time": 3.9181971503318514e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1906137298912116e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0570019452651233e-03, - "cpu_time": 1.8773336871978402e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0554668898911652e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 380, - "real_time": 1.8728798400077624e+06, - "cpu_time": 2.0981805763157867e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9984201442126021e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 380, - "real_time": 1.8670808081591723e+06, - "cpu_time": 2.0974538973684269e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0201567831029758e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 380, - "real_time": 1.8757696530404869e+06, - "cpu_time": 2.1018046947368416e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9876383695376337e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 380, - "real_time": 1.8673089928358279e+06, - "cpu_time": 2.0971973078947351e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0192989217571735e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 380, - "real_time": 1.8720268951591081e+06, - "cpu_time": 2.0973531552631585e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0016088090903133e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8710132378404713e+06, - "cpu_time": 2.0983979263157896e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0054246055401400e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8720268951591079e+06, - "cpu_time": 2.0974538973684269e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0016088090903133e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7523534153405540e+03, - "cpu_time": 1.9414900139252593e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4049080738610623e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0055194369824614e-03, - "cpu_time": 9.2522490113873784e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0054574175989428e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8719649071744359e+06, - "cpu_time": 2.1206745356200528e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4003681318774450e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8759729443726162e+06, - "cpu_time": 2.1203973430079189e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3973762296858132e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8796512702652584e+06, - "cpu_time": 2.1242366306068548e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3946416771394300e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8788765876162010e+06, - "cpu_time": 2.1238162348284936e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3952167041082332e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8791353774175914e+06, - "cpu_time": 2.1242754617414167e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3950245583703095e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8771202173692207e+06, - "cpu_time": 2.1226800411609476e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3965254602362463e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8788765876162010e+06, - "cpu_time": 2.1238162348284936e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3952167041082332e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2189048511765131e+03, - "cpu_time": 1.9679962467844557e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3981306139366137e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7148101764562530e-03, - "cpu_time": 9.2712806858451864e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7172122401054749e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 369, - "real_time": 1.9024523606222265e+06, - "cpu_time": 2.1845281815718277e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7558535017850512e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 369, - "real_time": 1.9027803509324528e+06, - "cpu_time": 2.1854544471544656e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7553784636417651e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 369, - "real_time": 1.9027395724435020e+06, - "cpu_time": 2.1846839485094836e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7554375154278642e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 369, - "real_time": 1.9006010313419914e+06, - "cpu_time": 2.1838460325203254e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7585379117142045e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 369, - "real_time": 1.8969101671679679e+06, - "cpu_time": 2.1813700325203235e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7639052659132874e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9010966965016283e+06, - "cpu_time": 2.1839765284552854e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7578225316964340e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9024523606222265e+06, - "cpu_time": 2.1845281815718277e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7558535017850512e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5072031540156418e+03, - "cpu_time": 1.5652362615521006e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6417809579929436e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3188193733803032e-03, - "cpu_time": 7.1669097225105427e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3205276685272259e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 370, - "real_time": 1.9021051190950831e+06, - "cpu_time": 2.2657980675675552e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5127132011445022e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 370, - "real_time": 1.8997820934305927e+06, - "cpu_time": 2.2639750513513484e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5194540659476388e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 370, - "real_time": 1.9044956182935147e+06, - "cpu_time": 2.2663902837837827e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5057937121407270e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 370, - "real_time": 1.8992069846717641e+06, - "cpu_time": 2.2632703486486604e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5211254405807865e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 370, - "real_time": 1.9049124882676061e+06, - "cpu_time": 2.2664321459459425e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5045888273513901e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9021004607517119e+06, - "cpu_time": 2.2651731794594582e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5127350494330096e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9021051190950833e+06, - "cpu_time": 2.2657980675675557e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5127132011445022e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6168363992322329e+03, - "cpu_time": 1.4588609216729265e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5843164074292150e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3757614033688087e-03, - "cpu_time": 6.4403946457685713e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3757810486845852e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 361, - "real_time": 1.9540153635688995e+06, - "cpu_time": 2.4688007617728710e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0732525644883721e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 361, - "real_time": 1.9504590175395776e+06, - "cpu_time": 2.4647507562326831e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0752094666646571e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 361, - "real_time": 1.9495757019348505e+06, - "cpu_time": 2.4647675761772953e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0756966235877314e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 361, - "real_time": 1.9480754546189057e+06, - "cpu_time": 2.4640008698060936e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0765250365573020e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 361, - "real_time": 1.9467963291773277e+06, - "cpu_time": 2.4577503878116473e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0772323578842010e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9497843733679124e+06, - "cpu_time": 2.4640140703601181e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0755832098364530e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9495757019348505e+06, - "cpu_time": 2.4647507562326831e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0756966235877314e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7499444530560027e+03, - "cpu_time": 3.9767067119393605e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5158480488492241e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4103838817345498e-03, - "cpu_time": 1.6139139624954174e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4093266192577655e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 342, - "real_time": 2.0597699787249865e+06, - "cpu_time": 2.8785452456140271e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0362972775223701e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 342, - "real_time": 2.0599131242982086e+06, - "cpu_time": 2.8796132982456163e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0361557730396795e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 342, - "real_time": 2.0572600111144744e+06, - "cpu_time": 2.8785397953216354e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0387816694729950e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 342, - "real_time": 2.0580333967322800e+06, - "cpu_time": 2.8787064590643304e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0380155184360294e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 342, - "real_time": 2.0556787480954190e+06, - "cpu_time": 2.8781602514619753e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0403499349720922e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0581310517930738e+06, - "cpu_time": 2.8787130099415169e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0379200346886334e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0580333967322796e+06, - "cpu_time": 2.8785452456140267e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0380155184360294e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7779135031814235e+03, - "cpu_time": 5.4181455562995995e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7608170703397896e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.6384853949532489e-04, - "cpu_time": 1.8821416159194257e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6402657629734648e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 329, - "real_time": 2.1137411884487942e+06, - "cpu_time": 3.6210186352583473e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9686069637296162e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 329, - "real_time": 2.1204835587353827e+06, - "cpu_time": 3.6252245258358582e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9559882298747039e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 329, - "real_time": 2.1215714758409238e+06, - "cpu_time": 3.6237042249240056e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9539596452554216e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 329, - "real_time": 2.1223651594128516e+06, - "cpu_time": 3.6237562978723450e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9524810152465434e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 329, - "real_time": 2.1191559626514199e+06, - "cpu_time": 3.6242782826747820e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9584665535916681e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1194634690178749e+06, - "cpu_time": 3.6235963933130680e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9579004815395908e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1204835587353827e+06, - "cpu_time": 3.6237562978723450e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9559882298747039e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4184476746944410e+03, - "cpu_time": 1.5650736660713665e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3934871235281294e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6128835078617772e-03, - "cpu_time": 4.3191169661155717e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6153733913595310e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 191, - "real_time": 3.6690382381988913e+06, - "cpu_time": 6.6208500994764548e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5726468111806412e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 191, - "real_time": 3.6646076831576554e+06, - "cpu_time": 6.6229438586387513e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5781751965175438e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 191, - "real_time": 3.6663928542149630e+06, - "cpu_time": 6.6235126858638870e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5759460775493708e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 191, - "real_time": 3.6693583145074509e+06, - "cpu_time": 6.6257190209423909e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5722479414638624e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 191, - "real_time": 3.6672347759174583e+06, - "cpu_time": 6.6208939528795788e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5748955344160433e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6673263731992841e+06, - "cpu_time": 6.6227839235602133e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5747823122254925e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time_median", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6672347759174583e+06, - "cpu_time": 6.6229438586387504e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5748955344160433e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9577021321532980e+03, - "cpu_time": 2.0299713731159161e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4424492164055323e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.3382271795063816e-04, - "cpu_time": 3.0651330264519082e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3389408494441677e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 96, - "real_time": 7.4580427559946356e+06, - "cpu_time": 1.3661284249999905e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4990935420730295e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 96, - "real_time": 7.4633144201167552e+06, - "cpu_time": 1.3685648604166694e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4959156362964916e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 96, - "real_time": 7.4622077809181064e+06, - "cpu_time": 1.3696042906249890e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4965823768407125e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 96, - "real_time": 7.4593094420076041e+06, - "cpu_time": 1.3718653770833366e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4983295385275154e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 96, - "real_time": 7.4559328592537595e+06, - "cpu_time": 1.3697755499999965e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5003667057375240e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4597614516581725e+06, - "cpu_time": 1.3691877006249964e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4980575598950548e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time_median", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4593094420076041e+06, - "cpu_time": 1.3696042906249892e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4983295385275154e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0176339658508596e+03, - "cpu_time": 2.0878315667751136e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8195732823714465e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.0452150989092194e-04, - "cpu_time": 1.5248687713321383e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0452423254759313e-04, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 48, - "real_time": 1.4645315493301800e+07, - "cpu_time": 2.6583978145833537e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5822750647258501e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 48, - "real_time": 1.4358375493126610e+07, - "cpu_time": 2.5624060833333280e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6738479594801779e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 48, - "real_time": 1.4660928922239691e+07, - "cpu_time": 2.6587644395833421e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5773950856688318e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 48, - "real_time": 1.4629838774756839e+07, - "cpu_time": 2.6576874208333358e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5871225946654634e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 48, - "real_time": 1.4638855548885962e+07, - "cpu_time": 2.6584311687500119e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5842971655736494e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4586662846462181e+07, - "cpu_time": 2.6391373854166750e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6009875740227947e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time_median", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4638855548885962e+07, - "cpu_time": 2.6583978145833544e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5842971655736494e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2812000005459548e+05, - "cpu_time": 4.2895897226946254e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0884614058075197e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7833661066396302e-03, - "cpu_time": 1.6253756800983562e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8860518313307324e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 25, - "real_time": 2.8248011246323586e+07, - "cpu_time": 4.9986145400000058e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7514045087853088e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 25, - "real_time": 2.8171223923563957e+07, - "cpu_time": 5.0085204080000378e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7643555837037287e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 25, - "real_time": 2.8239275068044662e+07, - "cpu_time": 5.0077168599999599e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7528744160957479e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 25, - "real_time": 2.8187588974833488e+07, - "cpu_time": 5.0072793200000092e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7615895108954725e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 25, - "real_time": 2.7786782085895538e+07, - "cpu_time": 4.8496887599999927e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8302724505882378e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8126576259732254e+07, - "cpu_time": 4.9743639776000015e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7720992940136995e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time_median", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8187588974833488e+07, - "cpu_time": 5.0072793200000100e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7615895108954725e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9275860760632119e+05, - "cpu_time": 6.9811345653269440e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2986386597295556e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.8532552923011233e-03, - "cpu_time": 1.4034225474379452e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9123428841212330e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.4552702233195305e+07, - "cpu_time": 9.3672381099999309e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9206628638215666e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.4461663216352463e+07, - "cpu_time": 9.3779136599999905e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9288883252357330e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.0718251988291740e+07, - "cpu_time": 8.9949174599999532e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2926795675444031e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.4467422887682915e+07, - "cpu_time": 9.3814714299999475e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9283671187002888e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.4440735653042793e+07, - "cpu_time": 9.3578731399999529e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9307830392074547e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3728155195713043e+07, - "cpu_time": 9.2958827599999562e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0002761829018898e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time_median", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4461663216352463e+07, - "cpu_time": 9.3672381099999309e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9288883252357330e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6831307718034324e+06, - "cpu_time": 1.6849999553220223e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6350417172232494e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1326792548010823e-02, - "cpu_time": 1.8126303857580389e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2699028161967639e-02, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.0655531473457813e+08, - "cpu_time": 1.8058430624999923e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0384245341239719e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 9.4823699444532394e+07, - "cpu_time": 1.7365919262500107e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6617798624704084e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.0617835167795420e+08, - "cpu_time": 1.7996775199999958e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0563123604363737e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 9.4792198389768600e+07, - "cpu_time": 1.7452520012500018e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6636613679164038e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.0616035200655460e+08, - "cpu_time": 1.8008009787500077e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0571696669473391e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0170198325067759e+08, - "cpu_time": 1.7776330977500018e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.2954695583788996e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time_median", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0616035200655460e+08, - "cpu_time": 1.7996775199999958e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0571696669473391e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.2953488325637924e+06, - "cpu_time": 3.3732115788200079e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3533699302803844e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.1899961351263522e-02, - "cpu_time": 1.8975859434039417e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3325261212661008e-02, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.9139072671532631e+08, - "cpu_time": 3.0807746949999881e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6102081977936096e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.9146832451224327e+08, - "cpu_time": 3.0902189925000203e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6079345068449717e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.9113072752952576e+08, - "cpu_time": 3.0917194349999732e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6178398830932560e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.9208712503314018e+08, - "cpu_time": 3.0960023975000441e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5898687838383274e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.9281717017292976e+08, - "cpu_time": 3.0913404999999726e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5687044003239193e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9177881479263306e+08, - "cpu_time": 3.0900112039999998e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5989111543788166e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time_median", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9146832451224327e+08, - "cpu_time": 3.0913404999999726e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6079345068449717e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7828290019170276e+05, - "cpu_time": 5.6110550505858310e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9758247049954608e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.5367978518644912e-03, - "cpu_time": 1.8158688367609659e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5289445581757456e-03, - "dst_gpu": NaN, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8632594538784383e+06, - "cpu_time": 2.0649631609497985e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1982982517405380e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8607154964284459e+06, - "cpu_time": 2.0623770131926078e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2013037500155587e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8656902797288252e+06, - "cpu_time": 2.0673825013193106e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.1954340677571343e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8611262661445148e+06, - "cpu_time": 2.0625407546174033e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2008178996287133e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8565470491875992e+06, - "cpu_time": 2.0623606253298142e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2062462687343992e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8614677090735647e+06, - "cpu_time": 2.0639248110817871e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2004200475752684e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time_median", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8611262661445145e+06, - "cpu_time": 2.0625407546174030e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2008178996287133e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3887959968310643e+03, - "cpu_time": 2.2243965415709904e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0076826712036977e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8204967941762669e-03, - "cpu_time": 1.0777507638008836e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8213261943418144e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8658135485035826e+06, - "cpu_time": 2.0683050554090119e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3905780438619591e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8620457329781477e+06, - "cpu_time": 2.0649793403693498e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3994622983280607e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8668545958402352e+06, - "cpu_time": 2.0694971583113610e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3881296477259593e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8625426178760913e+06, - "cpu_time": 2.0649337678100371e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3982886197479675e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8574922677277867e+06, - "cpu_time": 2.0651126992084386e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4102471608245354e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8629497525851685e+06, - "cpu_time": 2.0665656042216397e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3973411540976958e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time_median", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8625426178760913e+06, - "cpu_time": 2.0651126992084384e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3982886197479675e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6815852223612828e+03, - "cpu_time": 2.1742674556423526e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6970320135507463e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9762128405516246e-03, - "cpu_time": 1.0521163476255948e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9777933321016841e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8675173874370072e+06, - "cpu_time": 2.0719363201058132e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7731445555564575e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8618907160806302e+06, - "cpu_time": 2.0647205608465162e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7996571756311841e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8666060695303949e+06, - "cpu_time": 2.0698128386243146e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7774277966008782e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8612473348896920e+06, - "cpu_time": 2.0648185978835633e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8026989712095466e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8561980243402389e+06, - "cpu_time": 2.0650354603174550e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8266444555792902e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8626919064555925e+06, - "cpu_time": 2.0672647555555322e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7959145909154713e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time_median", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8618907160806297e+06, - "cpu_time": 2.0650354603174548e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7996571756311841e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5690572668125587e+03, - "cpu_time": 3.3816643093493249e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1590480615832901e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4529323668489823e-03, - "cpu_time": 1.6358157803742831e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4546032584413465e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8695923067247753e+06, - "cpu_time": 2.0757830873015665e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7526815810129352e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8635385504961642e+06, - "cpu_time": 2.0697154338624806e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7583752153276127e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8677776931360348e+06, - "cpu_time": 2.0738081666666272e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7543843745655779e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8641705015811592e+06, - "cpu_time": 2.0692127169311829e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7577791286905739e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8592921918387113e+06, - "cpu_time": 2.0697394708994573e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7623910939783335e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8648742487553689e+06, - "cpu_time": 2.0716517751322631e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7571222787150066e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time_median", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8641705015811590e+06, - "cpu_time": 2.0697394708994571e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7577791286905739e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0040220285959804e+03, - "cpu_time": 2.9611270906739401e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7741764511446730e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1470734722559954e-03, - "cpu_time": 1.4293556118932628e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1479304524581804e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8653586467691986e+06, - "cpu_time": 2.0760680449735860e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5133190131296396e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8612481623662577e+06, - "cpu_time": 2.0761807169312381e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5210780230768487e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8720705885489078e+06, - "cpu_time": 2.0821512566137863e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5007226971499354e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8659059450901286e+06, - "cpu_time": 2.0759388835978864e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5122885037399046e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8614919658469423e+06, - "cpu_time": 2.0772519576719368e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5206168601529479e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8652150617242870e+06, - "cpu_time": 2.0775181719576865e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5136050194498554e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time_median", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8653586467691984e+06, - "cpu_time": 2.0761807169312381e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5133190131296396e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3901571145255748e+03, - "cpu_time": 2.6420706564912762e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2580405412694599e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3537002271829823e-03, - "cpu_time": 1.2717437046539048e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3503041735073761e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8664656728981633e+06, - "cpu_time": 2.0897463952254374e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0224704318551630e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8700179552834786e+06, - "cpu_time": 2.0897537559681770e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0091305610020518e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8664126735877257e+06, - "cpu_time": 2.0895803023872476e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0226698443943739e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8751188918972260e+06, - "cpu_time": 2.0951757082228304e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.9900634336515427e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8659356270672195e+06, - "cpu_time": 2.0890979893899495e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0244652655039415e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8687901641467628e+06, - "cpu_time": 2.0906708302387286e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0137599072814152e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time_median", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8664656728981629e+06, - "cpu_time": 2.0897463952254374e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0224704318551630e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8975751717399280e+03, - "cpu_time": 2.5324202993816457e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4601529216147191e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0856141296738107e-03, - "cpu_time": 1.2112955625312258e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0818404691880666e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8701654608640696e+06, - "cpu_time": 2.1090598829787755e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4017155459543243e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8690748361513352e+06, - "cpu_time": 2.1086644361702004e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4025334616338217e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8705612411066156e+06, - "cpu_time": 2.1088341170212440e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4014189658121902e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8696978251992210e+06, - "cpu_time": 2.1087891648936635e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4020661331842107e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8729858687599536e+06, - "cpu_time": 2.1092100319148973e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3996047934603879e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8704970464162391e+06, - "cpu_time": 2.1089115265957564e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4014677800089869e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time_median", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8701654608640694e+06, - "cpu_time": 2.1088341170212440e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4017155459543243e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4974764761038866e+03, - "cpu_time": 2.1973469759289509e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1211816891119833e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.0057676593126015e-04, - "cpu_time": 1.0419341675636573e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0000532663319142e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 375, - "real_time": 1.8914088940558336e+06, - "cpu_time": 2.1587004799999553e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7719442456239361e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 375, - "real_time": 1.8907149481431891e+06, - "cpu_time": 2.1587115680000200e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7729616276366067e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 375, - "real_time": 1.8940728550466397e+06, - "cpu_time": 2.1613727999999807e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7680455828458083e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 375, - "real_time": 1.8959424606679627e+06, - "cpu_time": 2.1609918453333043e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7653159886259794e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 375, - "real_time": 1.8944312629755586e+06, - "cpu_time": 2.1600144400000167e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7675218956031567e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8933140841778372e+06, - "cpu_time": 2.1599582266666559e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7691578680670977e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time_median", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8940728550466399e+06, - "cpu_time": 2.1600144400000167e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7680455828458083e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1861748669319268e+03, - "cpu_time": 1.2458561019575714e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1978941780490486e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1546815635089214e-03, - "cpu_time": 5.7679638734506105e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1548255211181635e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 369, - "real_time": 1.8997876210041030e+06, - "cpu_time": 2.2289299566395353e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5194380066851449e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 369, - "real_time": 1.9070053827093262e+06, - "cpu_time": 2.2340098428183720e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4985476680210733e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 369, - "real_time": 1.8994467825752487e+06, - "cpu_time": 2.2292730135501060e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5204284195756841e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 369, - "real_time": 1.9062721741677271e+06, - "cpu_time": 2.2334628238482689e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5006625717432261e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 369, - "real_time": 1.8999207456316042e+06, - "cpu_time": 2.2301946883468796e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5190512678538835e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9024865412176021e+06, - "cpu_time": 2.2311740650406326e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5116255867758024e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time_median", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8999207456316047e+06, - "cpu_time": 2.2301946883468800e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5190512678538835e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8032405647663413e+03, - "cpu_time": 2.3921355772161587e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1010042769762522e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9990893403809555e-03, - "cpu_time": 1.0721420684730819e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9976035375442094e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 360, - "real_time": 1.9502147771870822e+06, - "cpu_time": 2.4105063972221785e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0753441233918116e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 360, - "real_time": 1.9480943243252111e+06, - "cpu_time": 2.4085992916666674e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0765146090790136e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 360, - "real_time": 1.9496294475781422e+06, - "cpu_time": 2.4095967444444629e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0756669697439749e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 360, - "real_time": 1.9498054246974385e+06, - "cpu_time": 2.4091526638888656e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0755698868390553e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 360, - "real_time": 1.9499205250111925e+06, - "cpu_time": 2.4096392972222390e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0755063978763762e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9495328997598130e+06, - "cpu_time": 2.4094988788888827e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0757203973860462e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time_median", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9498054246974383e+06, - "cpu_time": 2.4095967444444629e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0755698868390553e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3191056727917351e+02, - "cpu_time": 7.0240838749577017e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5925430375773291e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2672302036127045e-04, - "cpu_time": 2.9151637863375105e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2692720605995844e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 349, - "real_time": 2.0101800228050111e+06, - "cpu_time": 2.7194888796561719e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0865315307169633e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 349, - "real_time": 2.0081514147721382e+06, - "cpu_time": 2.7180712349570254e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0886393173076153e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 349, - "real_time": 2.0095606859543903e+06, - "cpu_time": 2.7179635787964952e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0871745896083853e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 349, - "real_time": 2.0084356119253146e+06, - "cpu_time": 2.7178388767908197e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0883437711897974e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 349, - "real_time": 2.0078910090413510e+06, - "cpu_time": 2.7180354040114642e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0889101953808398e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0088437488996412e+06, - "cpu_time": 2.7182795948423953e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0879198808407204e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time_median", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0084356119253146e+06, - "cpu_time": 2.7180354040114642e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0883437711897974e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8148385911700484e+02, - "cpu_time": 6.8181949602716281e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0199227704096031e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.8858148357960624e-04, - "cpu_time": 2.5082758128370321e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8848750364833052e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 329, - "real_time": 2.1438795229629544e+06, - "cpu_time": 3.3838003069908815e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9128168864668770e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 329, - "real_time": 2.1325885371296559e+06, - "cpu_time": 3.3817152097264286e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9335332878092813e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 329, - "real_time": 2.1440682261842545e+06, - "cpu_time": 3.3835034285714314e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9124725125603862e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 329, - "real_time": 2.1262551664224737e+06, - "cpu_time": 3.3752654164134283e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9452499081350780e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 329, - "real_time": 2.1438201667180448e+06, - "cpu_time": 3.3838147750759753e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9129252211681752e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1381223238834767e+06, - "cpu_time": 3.3816198273556293e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9233995632279596e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time_median", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1438201667180448e+06, - "cpu_time": 3.3835034285714314e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9129252211681752e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2525258317757580e+03, - "cpu_time": 3.6574539193023475e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5175928898768602e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8597070614681565e-03, - "cpu_time": 1.0815686286540424e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8680559178843037e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 212, - "real_time": 3.3054854534127098e+06, - "cpu_time": 5.6353435896226671e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0755679419731102e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 212, - "real_time": 3.3067156723261159e+06, - "cpu_time": 5.6373989528300976e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0736796454586105e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 212, - "real_time": 3.3043812485938929e+06, - "cpu_time": 5.6344863207547162e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0772640133880367e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 212, - "real_time": 3.3054009007448154e+06, - "cpu_time": 5.6345207641509436e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0756977757885714e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 212, - "real_time": 3.3054771176363640e+06, - "cpu_time": 5.6359466556603294e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0755807415774298e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3054920785427801e+06, - "cpu_time": 5.6355392566037504e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0755580236371527e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time_median", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3054771176363644e+06, - "cpu_time": 5.6353435896226671e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.0755807415774298e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2760286966532863e+02, - "cpu_time": 1.2050653914210720e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2707134525139804e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5037206261591642e-04, - "cpu_time": 2.1383319972600155e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5035935883230926e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 104, - "real_time": 6.7819850429749256e+06, - "cpu_time": 1.1429729798076838e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9475827191269217e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 104, - "real_time": 6.7791265587752257e+06, - "cpu_time": 1.1419085221153963e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9496689151739674e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 104, - "real_time": 6.7812743363901973e+06, - "cpu_time": 1.1429057490384655e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9481012469791441e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 104, - "real_time": 6.7853374281325024e+06, - "cpu_time": 1.1438797586538276e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9451383008427687e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 104, - "real_time": 6.7880927638795516e+06, - "cpu_time": 1.1428053778846156e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9431310335869465e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7831632260304810e+06, - "cpu_time": 1.1428944774999978e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9467244431419497e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time_median", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7819850429749265e+06, - "cpu_time": 1.1429057490384657e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9475827191269217e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5453561209883846e+03, - "cpu_time": 6.9948469865227507e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5850813162916172e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.2267002913670600e-04, - "cpu_time": 6.1202911766828141e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2258445886864142e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52, - "real_time": 1.3482800863969784e+07, - "cpu_time": 2.2255891057692606e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9773681801780262e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52, - "real_time": 1.3528231513471557e+07, - "cpu_time": 2.2305060230769195e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9606531299506721e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52, - "real_time": 1.3475610194011377e+07, - "cpu_time": 2.2248452653846364e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9800241349978714e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52, - "real_time": 1.3553585481041899e+07, - "cpu_time": 2.2314305865384981e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9513735014154472e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52, - "real_time": 1.3487991805259999e+07, - "cpu_time": 2.2257048403846424e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9754526076913195e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3505643971550923e+07, - "cpu_time": 2.2276151642307915e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9689743108466673e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time_median", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3487991805259999e+07, - "cpu_time": 2.2257048403846424e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.9754526076913195e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3704672206723655e+04, - "cpu_time": 3.0960096074103443e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2385016454203038e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4955990456820227e-03, - "cpu_time": 1.3898314471563647e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4924694070500731e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 27, - "real_time": 2.2060151453371402e+07, - "cpu_time": 4.1530629962962896e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 6.0841707403367720e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 27, - "real_time": 2.6069903470299862e+07, - "cpu_time": 4.2372402925926268e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1483784031999788e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 27, - "real_time": 2.6175663565044049e+07, - "cpu_time": 4.2445329777777903e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1275769061778183e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 27, - "real_time": 2.6075118048875421e+07, - "cpu_time": 4.2419741370370850e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1473488153887224e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 27, - "real_time": 2.6072201905427154e+07, - "cpu_time": 4.2397978666666925e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1479245399699602e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5290607688603576e+07, - "cpu_time": 4.2233216540740967e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.3310798810146503e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time_median", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6072201905427154e+07, - "cpu_time": 4.2397978666666925e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.1479245399699602e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8064342869785707e+06, - "cpu_time": 3.9367843623634643e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2108256808697420e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.1427081121209435e-02, - "cpu_time": 9.3215357124546289e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8986355013466930e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 16, - "real_time": 5.1166998222470284e+07, - "cpu_time": 8.2126040749999523e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2462615616586046e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 16, - "real_time": 5.1072767702862620e+07, - "cpu_time": 8.2022782562498614e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2559410439969997e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 16, - "real_time": 5.1108367741107941e+07, - "cpu_time": 8.2091528375000775e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2522799663603735e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 16, - "real_time": 4.2692180024459958e+07, - "cpu_time": 8.0069442124999672e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.2876961505878410e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 16, - "real_time": 5.1081407582387328e+07, - "cpu_time": 8.2030016750000104e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2550520571902857e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9424344254657634e+07, - "cpu_time": 8.1667962112499744e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.4594461559588213e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time_median", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1081407582387328e+07, - "cpu_time": 8.2030016750000089e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2550520571902857e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7635744948618300e+06, - "cpu_time": 8.9463563526848820e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6302128276372194e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.6148192790785690e-02, - "cpu_time": 1.0954548296871966e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4811035686898045e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 9.4352710992097855e+07, - "cpu_time": 1.5206052137499881e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6900422505609140e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 1.0054269246757030e+08, - "cpu_time": 1.5827201974999738e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.3397308031428127e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 9.3814225867390633e+07, - "cpu_time": 1.5154686512499893e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.7227025756081381e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 1.0046921670436859e+08, - "cpu_time": 1.5813101150000009e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.3436358877938366e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 9.3780806288123131e+07, - "cpu_time": 1.5166469637499702e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.7247419088141499e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6591930463910118e+07, - "cpu_time": 1.5433502282499844e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.5641706851839714e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time_median", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.4352710992097855e+07, - "cpu_time": 1.5206052137499881e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6900422505609140e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5802944990661601e+06, - "cpu_time": 3.5350848067585630e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0357307448462942e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.7066186397463861e-02, - "cpu_time": 2.2905266361783739e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6586417995173086e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.7772912979125977e+08, - "cpu_time": 2.8911530974999523e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0414509723931799e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.7718904837965965e+08, - "cpu_time": 2.8867892600000286e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0598656283728867e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.7743757367134094e+08, - "cpu_time": 2.8902589950000387e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0513779679429131e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.7765997350215912e+08, - "cpu_time": 2.8935291049999988e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0438026801065054e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.7769000679254532e+08, - "cpu_time": 2.8923193600000727e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0427811523109636e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7754114642739296e+08, - "cpu_time": 2.8908099635000187e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0478556802252903e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time_median", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7765997350215912e+08, - "cpu_time": 2.8911530974999523e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0438026801065054e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2711086395882582e+05, - "cpu_time": 2.5621949650587747e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7434374017124977e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2792012923703005e-03, - "cpu_time": 8.8632424732500343e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2803608106971304e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8584787737374504e+06, - "cpu_time": 2.0681499340369406e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2039530705873142e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8538442486559232e+06, - "cpu_time": 2.0683672796833452e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2094628515689429e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8541275399278158e+06, - "cpu_time": 2.0689565092347863e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2091252687824615e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8590964044766480e+06, - "cpu_time": 2.0687736358837958e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2032208712452757e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8537763201428570e+06, - "cpu_time": 2.0684438364117155e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2095438136162786e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8558646573881388e+06, - "cpu_time": 2.0685382390501169e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2070611751600550e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time_median", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8541275399278160e+06, - "cpu_time": 2.0684438364117157e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2091252687824615e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6804185538205156e+03, - "cpu_time": 3.2375969580315467e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1859172127235393e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4442963516492721e-03, - "cpu_time": 1.5651617634674560e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4435110583160423e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8578662111922745e+06, - "cpu_time": 2.0690574432718842e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4093594849022161e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8534626635929537e+06, - "cpu_time": 2.0699982295514739e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4198354576615728e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8580165038334997e+06, - "cpu_time": 2.0688475751978515e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4090028173044156e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8631745187455413e+06, - "cpu_time": 2.0741065461740405e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.3967969278130746e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8537704078801586e+06, - "cpu_time": 2.0697280633245078e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4191017211067649e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8572580610488858e+06, - "cpu_time": 2.0703475715039517e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4108192817576090e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time_median", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8578662111922745e+06, - "cpu_time": 2.0697280633245080e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4093594849022161e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9534263683888116e+03, - "cpu_time": 2.1534937038746893e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3801277924313890e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1286359991115698e-03, - "cpu_time": 1.0401604704036909e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1266180256411743e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8598243468923317e+06, - "cpu_time": 2.0726901160949848e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8094340884271134e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8547937996353153e+06, - "cpu_time": 2.0724264564643570e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8333269192626048e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8596879644422315e+06, - "cpu_time": 2.0720068548811623e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8100801388548985e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8636643150753751e+06, - "cpu_time": 2.0767091319260958e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7912827795585897e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8542272212958434e+06, - "cpu_time": 2.0723761187335397e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8360260338265859e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8584395294682193e+06, - "cpu_time": 2.0732417356200286e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8160299919859599e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time_median", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8596879644422315e+06, - "cpu_time": 2.0724264564643570e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8100801388548985e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9309534459480137e+03, - "cpu_time": 1.9535880050969558e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8643742927106436e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1151903968986445e-03, - "cpu_time": 9.4228664778095016e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1147549343700244e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8649235953393308e+06, - "cpu_time": 2.0793030529100560e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7570693020288438e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8592122597852412e+06, - "cpu_time": 2.0799521825395497e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7624668634545822e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8638760258293359e+06, - "cpu_time": 2.0790380317459684e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7580568420809962e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8684129451189644e+06, - "cpu_time": 2.0833485052909204e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7537878917828638e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8620164956946464e+06, - "cpu_time": 2.0771524867725067e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7598125513799772e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8636882643535037e+06, - "cpu_time": 2.0797588518518005e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7582386901454527e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time_median", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8638760258293361e+06, - "cpu_time": 2.0793030529100560e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7580568420809962e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4173576303641212e+03, - "cpu_time": 2.2607223288513101e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2235319164553421e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8336530286354360e-03, - "cpu_time": 1.0870117594827791e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8333869767071676e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 373, - "real_time": 1.8631497094262238e+06, - "cpu_time": 2.0841250697050730e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5174843797271930e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 373, - "real_time": 1.8583797352413782e+06, - "cpu_time": 2.0844219517426065e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5265128411168218e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 373, - "real_time": 1.8637386820046231e+06, - "cpu_time": 2.0840886461125186e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5163727958637409e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 373, - "real_time": 1.8683675662032329e+06, - "cpu_time": 2.0895920589813108e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5076609755744003e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 373, - "real_time": 1.8625787971790968e+06, - "cpu_time": 2.0833736863270456e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5185625488304302e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8632428980109110e+06, - "cpu_time": 2.0851202825737111e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5173187082225181e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time_median", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8631497094262238e+06, - "cpu_time": 2.0841250697050733e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5174843797271930e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5569682313689545e+03, - "cpu_time": 2.5293166605767956e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7132930860625318e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9090201471671597e-03, - "cpu_time": 1.2130315367009919e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9086394048877940e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 374, - "real_time": 1.8620722242590552e+06, - "cpu_time": 2.0974661871657632e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0390395330747917e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 374, - "real_time": 1.8659045223385112e+06, - "cpu_time": 2.1020039278073576e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0245823637175903e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 374, - "real_time": 1.8574399007113904e+06, - "cpu_time": 2.0968358877006173e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0565943990866169e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 374, - "real_time": 1.8622664210463148e+06, - "cpu_time": 2.0976107112299232e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0383055033746019e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 374, - "real_time": 1.8580696193571698e+06, - "cpu_time": 2.0968186898395997e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0542028476493001e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8611505375424884e+06, - "cpu_time": 2.0981470807486521e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0425449293805808e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time_median", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8620722242590550e+06, - "cpu_time": 2.0974661871657632e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0390395330747917e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4625119637631310e+03, - "cpu_time": 2.1857737292887223e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3097795221429445e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8604147778046598e-03, - "cpu_time": 1.0417638254934937e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8598099625587261e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8632719163501405e+06, - "cpu_time": 2.1213788068782301e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4069014710075128e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8626099278215349e+06, - "cpu_time": 2.1213662486771950e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4074014966010490e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8624405988101556e+06, - "cpu_time": 2.1210991322752149e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4075294544560191e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8621527560368776e+06, - "cpu_time": 2.1207425608466147e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4077470237076971e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8616101074570830e+06, - "cpu_time": 2.1200421481482587e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4081573738234735e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8624170612951580e+06, - "cpu_time": 2.1209257793651028e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4075473639191505e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time_median", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8624405988101556e+06, - "cpu_time": 2.1210991322752149e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4075294544560191e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.1023774971939963e+02, - "cpu_time": 5.5760010913291501e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6118103549473934e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2765902031365056e-04, - "cpu_time": 2.6290411223151434e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2764867976494577e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 372, - "real_time": 1.8943431925670726e+06, - "cpu_time": 2.1887299973118557e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7676505611927903e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 372, - "real_time": 1.8956631879567581e+06, - "cpu_time": 2.1871740161289317e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7657233802440625e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 372, - "real_time": 1.8973913543196695e+06, - "cpu_time": 2.1891521370968525e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7632043268584895e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 372, - "real_time": 1.8929414571918827e+06, - "cpu_time": 2.1876962876345161e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7697000243090677e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 372, - "real_time": 1.8914356637309226e+06, - "cpu_time": 2.1862199408602887e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7719050140242344e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8943549711532616e+06, - "cpu_time": 2.1877944758064887e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7676366613257289e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time_median", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8943431925670723e+06, - "cpu_time": 2.1876962876345157e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7676505611927903e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3157919928368551e+03, - "cpu_time": 1.1823933452441490e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3831467635915533e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2224699320355088e-03, - "cpu_time": 5.4044991808852700e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2223955589499194e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 373, - "real_time": 1.8888921616567753e+06, - "cpu_time": 2.2673993083109008e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5512750875109696e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 373, - "real_time": 1.8914024232126442e+06, - "cpu_time": 2.2685671769436486e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5439074579324043e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 373, - "real_time": 1.8887180192383560e+06, - "cpu_time": 2.2672047024128679e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5517869227659965e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 373, - "real_time": 1.8894155086867071e+06, - "cpu_time": 2.2659012412867285e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5497374462054825e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 373, - "real_time": 1.8893039936540604e+06, - "cpu_time": 2.2664420643431535e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5500650161225390e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8895464212897089e+06, - "cpu_time": 2.2671028986594598e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5493543861074793e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time_median", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8893039936540604e+06, - "cpu_time": 2.2672047024128679e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5500650161225390e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0764476332216750e+03, - "cpu_time": 1.0152605592671423e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1593941292595956e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.6968573044474159e-04, - "cpu_time": 4.4782288438141333e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6932643140776432e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 364, - "real_time": 1.9354302766169985e+06, - "cpu_time": 2.4703439780220115e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0835585375184274e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 364, - "real_time": 1.9352927130447435e+06, - "cpu_time": 2.4694505439559999e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0836355585200379e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 364, - "real_time": 1.9346689583111943e+06, - "cpu_time": 2.4697988626372875e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0839849324044771e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 364, - "real_time": 1.9340197124600329e+06, - "cpu_time": 2.4700066978021800e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0843488235869460e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 364, - "real_time": 1.9357617156756632e+06, - "cpu_time": 2.4710101978021506e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0833730117800190e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9350346752217268e+06, - "cpu_time": 2.4701220560439257e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0837801727619815e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time_median", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9352927130447433e+06, - "cpu_time": 2.4700066978021795e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0836355585200379e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9202060482630736e+02, - "cpu_time": 5.9302932667800303e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8765506440649013e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.5762697882765949e-04, - "cpu_time": 2.4008098111061814e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5768790954955631e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 344, - "real_time": 2.0317115403338186e+06, - "cpu_time": 2.8874096482558195e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0644190460772099e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 344, - "real_time": 2.0318385203461009e+06, - "cpu_time": 2.8865069331395598e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0642900299407392e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 344, - "real_time": 2.0305585247453649e+06, - "cpu_time": 2.8857650494186333e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0655912887445447e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 344, - "real_time": 2.0300031766203386e+06, - "cpu_time": 2.8862562034883169e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0661563727121401e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 344, - "real_time": 2.0282682857806468e+06, - "cpu_time": 2.8856518720929306e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0679236713429563e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0304760095652540e+06, - "cpu_time": 2.8863179412790518e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0656760817635183e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time_median", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0305585247453649e+06, - "cpu_time": 2.8862562034883173e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0655912887445447e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4566567857917748e+03, - "cpu_time": 7.0368515156399121e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4824647159106352e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.1739669857200637e-04, - "cpu_time": 2.4380029015519955e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1766562482778937e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 337, - "real_time": 2.0770264726590905e+06, - "cpu_time": 3.6424380326410378e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0387583453669586e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 337, - "real_time": 2.0782841899423953e+06, - "cpu_time": 3.6422785608308478e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0363142060145831e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 337, - "real_time": 2.0729624182649110e+06, - "cpu_time": 3.6424999881305816e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0466763536510916e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 337, - "real_time": 2.0772021330163458e+06, - "cpu_time": 3.6450767181008817e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0384168043476534e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 337, - "real_time": 2.0805212792744227e+06, - "cpu_time": 3.6433564569733115e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0319741420407438e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0771992986314329e+06, - "cpu_time": 3.6431299513353324e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0384279702842064e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time_median", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0772021330163456e+06, - "cpu_time": 3.6424999881305820e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0384168043476534e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7474341047905868e+03, - "cpu_time": 1.1663700701148286e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3447403800895698e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3226627346739138e-03, - "cpu_time": 3.2015604320875622e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3234705235347880e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 189, - "real_time": 3.7013458607905600e+06, - "cpu_time": 6.8072491428569425e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5327339381401672e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 189, - "real_time": 3.7068934303033287e+06, - "cpu_time": 6.8089752962964904e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5259504529719238e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 189, - "real_time": 3.7079922788377320e+06, - "cpu_time": 6.8133620952381827e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5246092058365364e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 189, - "real_time": 3.7050131713311193e+06, - "cpu_time": 6.7998078253967874e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5282473298124237e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 189, - "real_time": 3.7009827669453686e+06, - "cpu_time": 6.7964216878308635e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5331786329411068e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7044455016416223e+06, - "cpu_time": 6.8051632095238538e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5289439119404316e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time_median", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7050131713311188e+06, - "cpu_time": 6.8072491428569434e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5282473298124237e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1816873297865886e+03, - "cpu_time": 6.9137397806147319e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8901433394259396e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.5888355716844187e-04, - "cpu_time": 1.0159550282260572e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5895153816537397e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 95, - "real_time": 7.5182302511836356e+06, - "cpu_time": 1.3941376136842553e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4630758674512987e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 95, - "real_time": 7.5192625732406192e+06, - "cpu_time": 1.3943871778947499e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4624631302825823e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 95, - "real_time": 7.5243641034160787e+06, - "cpu_time": 1.3948730052631594e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4594375735706635e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 95, - "real_time": 7.5245157227312261e+06, - "cpu_time": 1.3937407968421068e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4593477157119303e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 95, - "real_time": 7.5229561544562643e+06, - "cpu_time": 1.3933047147368502e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4602721737416811e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5218657610055655e+06, - "cpu_time": 1.3940886616842244e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4609192921516314e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time_median", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5229561544562634e+06, - "cpu_time": 1.3941376136842553e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4602721737416811e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9345565258432589e+03, - "cpu_time": 6.0047602786422967e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7405715938392193e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.9013678508548004e-04, - "cpu_time": 4.3073015681713062e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9018226509982229e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 48, - "real_time": 1.4020963921211660e+07, - "cpu_time": 2.5905443437500492e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7863231356350718e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 48, - "real_time": 1.4682143072908124e+07, - "cpu_time": 2.7087393875000030e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5707812317829161e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 48, - "real_time": 1.4732850172246495e+07, - "cpu_time": 2.7148618749999780e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5550496486021824e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 48, - "real_time": 1.4725653377051154e+07, - "cpu_time": 2.7149862104166072e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5572758153186073e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 48, - "real_time": 1.4715023299989602e+07, - "cpu_time": 2.7134790291666400e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5605679740953875e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4575326768681407e+07, - "cpu_time": 2.6885221691666555e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6059995610868330e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time_median", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4715023299989602e+07, - "cpu_time": 2.7134790291666400e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5605679740953875e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1050552419302322e+05, - "cpu_time": 5.4830102667761955e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0098372187791535e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1303503456280581e-02, - "cpu_time": 2.0394141918032724e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1924388080941805e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 25, - "real_time": 2.8413940295577049e+07, - "cpu_time": 5.1241220520000756e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7236577047672796e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 25, - "real_time": 2.8384627923369408e+07, - "cpu_time": 5.1223832319999479e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7285357540127172e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 25, - "real_time": 2.8419796675443649e+07, - "cpu_time": 5.1314089239999704e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7226843151897669e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 25, - "real_time": 2.5732265785336494e+07, - "cpu_time": 4.8830315239999898e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.2159312016932392e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 25, - "real_time": 2.8364084139466286e+07, - "cpu_time": 5.1185832559999660e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7319605787393322e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7862942963838577e+07, - "cpu_time": 5.0759057975999899e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8245539108804674e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time_median", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8384627923369408e+07, - "cpu_time": 5.1223832319999471e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7285357540127172e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1912983494502562e+06, - "cpu_time": 1.0792058076325529e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1881879164244372e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2755654023925657e-02, - "cpu_time": 2.1261344293324498e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5355238159730693e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.5166532099246979e+07, - "cpu_time": 9.5859054400000334e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8659113738937407e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.5307603627443314e+07, - "cpu_time": 9.5938668899998456e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8535000324404564e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.2567259967327118e+07, - "cpu_time": 9.2994377800005168e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.1065141338324375e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.5148562788963318e+07, - "cpu_time": 9.5761200800001234e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8674968562140121e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.5126883462071419e+07, - "cpu_time": 9.5581788200001940e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8694110593915558e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4663368389010444e+07, - "cpu_time": 9.5227018020001441e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9125666911544409e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time_median", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5148562788963318e+07, - "cpu_time": 9.5761200800001234e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8674968562140121e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1738976856912039e+06, - "cpu_time": 1.2551705497316974e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0859891562082855e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1475033835039063e-02, - "cpu_time": 1.3180823844216797e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2106349378700867e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.0772499628365040e+08, - "cpu_time": 1.8389215724999985e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.9837171549894199e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 9.8221935331821442e+07, - "cpu_time": 1.7470415225000125e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4658962907450199e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.0784747824072838e+08, - "cpu_time": 1.8433919000000286e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.9780571670080252e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 9.8238898441195488e+07, - "cpu_time": 1.7494883512500080e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4649524833726006e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.0750733315944672e+08, - "cpu_time": 1.8381612712499872e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.9938073638544617e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0390812829136848e+08, - "cpu_time": 1.8034009235000068e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1772860919939060e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time_median", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0750733315944672e+08, - "cpu_time": 1.8381612712499875e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.9938073638544617e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1844525372433672e+06, - "cpu_time": 5.0379122685382264e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6309377660624054e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.9894581131378464e-02, - "cpu_time": 2.7935619877363378e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0816928392867000e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.9372923299670219e+08, - "cpu_time": 3.1309286350000322e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5424873540808268e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.9393130391836166e+08, - "cpu_time": 3.1182908949999446e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5367122393608408e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.9423726946115494e+08, - "cpu_time": 3.1378722150000727e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5279907248425112e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.9410534948110580e+08, - "cpu_time": 3.1333693674999094e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5317477177748671e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.9406627118587494e+08, - "cpu_time": 3.1344527999999624e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5328616221598845e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9401388540863994e+08, - "cpu_time": 3.1309827824999845e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5343599316437874e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time_median", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9406627118587494e+08, - "cpu_time": 3.1333693674999100e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5328616221598845e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9291000444967538e+05, - "cpu_time": 7.5214365289334487e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5050825349380551e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.9431029920028931e-04, - "cpu_time": 2.4022605844315230e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9470988568373868e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 380, - "real_time": 1.8537589148955273e+06, - "cpu_time": 2.0660827131579434e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2095645593865365e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 380, - "real_time": 1.8493217583837626e+06, - "cpu_time": 2.0662566736841896e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2148660618040580e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 380, - "real_time": 1.8540018368137106e+06, - "cpu_time": 2.0658586078947170e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2092750496080359e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 380, - "real_time": 1.8583563830026451e+06, - "cpu_time": 2.0707554052630952e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2040982222052994e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 380, - "real_time": 1.8492572971904576e+06, - "cpu_time": 2.0667823710525860e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2149432673446671e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8529392380572204e+06, - "cpu_time": 2.0671471542105065e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2105494320697193e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time_median", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8537589148955271e+06, - "cpu_time": 2.0662566736841896e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2095645593865365e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8009634741723939e+03, - "cpu_time": 2.0456590832704194e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5318653518054280e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0513157669204782e-03, - "cpu_time": 9.8960496310273888e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0501081251832853e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 380, - "real_time": 1.8536025913099844e+06, - "cpu_time": 2.0669739921053657e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4195018060535416e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 380, - "real_time": 1.8491599716454449e+06, - "cpu_time": 2.0674041394736259e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4301196898127105e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 380, - "real_time": 1.8544006895114619e+06, - "cpu_time": 2.0677960631578690e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4175997379283579e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 380, - "real_time": 1.8579019931501918e+06, - "cpu_time": 2.0717456052630879e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4092745635683071e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 380, - "real_time": 1.8540981285408826e+06, - "cpu_time": 2.0673977578947020e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4183206238640929e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8538326748315929e+06, - "cpu_time": 2.0682635115789298e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4189632842454016e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time_median", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8540981285408824e+06, - "cpu_time": 2.0674041394736257e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4183206238640929e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1160692955870454e+03, - "cpu_time": 1.9681460049311838e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4313351797446830e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6808794762828943e-03, - "cpu_time": 9.5159344731111386e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6816919946447768e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8552583452471115e+06, - "cpu_time": 2.0702489707448264e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8311151069463212e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8520032796933518e+06, - "cpu_time": 2.0717846436170968e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8466366013740581e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8572147936673842e+06, - "cpu_time": 2.0715562632979206e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8218121328050736e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8620535573527960e+06, - "cpu_time": 2.0763282500001455e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.7988876234539952e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8569033136760057e+06, - "cpu_time": 2.0715255132979276e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8232919179650396e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8566866579273299e+06, - "cpu_time": 2.0722887281915832e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8243486765088979e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time_median", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8569033136760057e+06, - "cpu_time": 2.0715562632979203e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8232919179650396e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6436103424936687e+03, - "cpu_time": 2.3372767238280776e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7308611952286752e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9624260921663169e-03, - "cpu_time": 1.1278721406103194e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9614605663037343e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 375, - "real_time": 1.8597307271556926e+06, - "cpu_time": 2.0769743999999263e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7619755119127378e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 375, - "real_time": 1.8560639371668608e+06, - "cpu_time": 2.0776317680000223e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7654564233394802e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 375, - "real_time": 1.8606267278664745e+06, - "cpu_time": 2.0772982080000779e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7611270175385524e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 375, - "real_time": 1.8657702140044423e+06, - "cpu_time": 2.0827778266666429e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7562720078841385e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 375, - "real_time": 1.8593578267997750e+06, - "cpu_time": 2.0768149813334274e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7623288819236308e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8603098865986492e+06, - "cpu_time": 2.0782994368000198e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7614319685197081e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time_median", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8597307271556929e+06, - "cpu_time": 2.0772982080000781e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7619755119127378e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5066185228974159e+03, - "cpu_time": 2.5230709010635833e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3171643962925998e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8849647298863966e-03, - "cpu_time": 1.2140074025850591e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8832202750812541e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8564926668374042e+06, - "cpu_time": 2.0847415145118490e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5300974343002774e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8568342025723495e+06, - "cpu_time": 2.0849925672823065e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5294481278517090e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8609663583157035e+06, - "cpu_time": 2.0842011345645655e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5216112159767561e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8679274393036400e+06, - "cpu_time": 2.0914431424802805e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5084874616131611e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8606969963751198e+06, - "cpu_time": 2.0843719287598401e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5221210185039625e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8605835326808435e+06, - "cpu_time": 2.0859500575197686e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5223530516491733e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time_median", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8606969963751198e+06, - "cpu_time": 2.0847415145118490e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5221210185039625e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6066542515263154e+03, - "cpu_time": 3.0862828785822080e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7059507744702991e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4759190708781363e-03, - "cpu_time": 1.4795574167541926e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4716292338708506e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8567763493024057e+06, - "cpu_time": 2.0990176174142361e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0591161961559877e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8652812882644765e+06, - "cpu_time": 2.1038509630607893e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0269294408648685e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8576168831306358e+06, - "cpu_time": 2.0987151767810420e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0559220897639975e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8625287688106892e+06, - "cpu_time": 2.0995097255936619e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0373141180361763e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8581935640124695e+06, - "cpu_time": 2.0993299208443491e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0537323203816891e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8600793707041356e+06, - "cpu_time": 2.1000846807388160e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0466028330405444e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time_median", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8581935640124697e+06, - "cpu_time": 2.0993299208443491e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0537323203816891e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6602445170588339e+03, - "cpu_time": 2.1271626449276328e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3852662002301219e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9677894259282299e-03, - "cpu_time": 1.0128937487317372e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9658638822877893e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8619373587416559e+06, - "cpu_time": 2.1232776111111841e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4079098782204118e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8626671082635222e+06, - "cpu_time": 2.1229460846560868e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4073582919729796e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8626425409733895e+06, - "cpu_time": 2.1229382698412077e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4073768542997381e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8666429570186194e+06, - "cpu_time": 2.1275644629630428e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4043606947666809e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8617731113514677e+06, - "cpu_time": 2.1224437962963469e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4080340853655833e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8631326152697310e+06, - "cpu_time": 2.1238340449735736e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4070079609250790e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time_median", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8626425409733895e+06, - "cpu_time": 2.1229460846560863e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4073768542997381e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0035130305030302e+03, - "cpu_time": 2.1064967965250898e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5110607572165984e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0753464429116744e-03, - "cpu_time": 9.9183681583336751e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0739532392006559e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 372, - "real_time": 1.8937612504457994e+06, - "cpu_time": 2.1918054489246886e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7685010445565951e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 372, - "real_time": 1.8902137453551404e+06, - "cpu_time": 2.1879094811827792e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7736968969162524e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 372, - "real_time": 1.8911814195528296e+06, - "cpu_time": 2.1882802580645122e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7722776597708327e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 372, - "real_time": 1.8900717639612155e+06, - "cpu_time": 2.1879663629032555e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7739052558575678e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 372, - "real_time": 1.8942859933695316e+06, - "cpu_time": 2.1921322715053475e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7677341322014594e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8919028345369033e+06, - "cpu_time": 2.1896187645161166e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7712229978605413e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time_median", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8911814195528298e+06, - "cpu_time": 2.1882802580645117e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7722776597708327e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9911954327784679e+03, - "cpu_time": 2.1530783897929423e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9158279109028366e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0524829269394638e-03, - "cpu_time": 9.8331199233614116e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0521809010512449e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 373, - "real_time": 1.8894862804634261e+06, - "cpu_time": 2.2721266702413126e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5495295776522934e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 373, - "real_time": 1.8944073019483082e+06, - "cpu_time": 2.2725137560320981e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5351138000871778e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 373, - "real_time": 1.8899058120234073e+06, - "cpu_time": 2.2716485898123863e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5482976629261398e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 373, - "real_time": 1.8940388195212909e+06, - "cpu_time": 2.2730954879355780e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5361906482203066e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 373, - "real_time": 1.8908469835527232e+06, - "cpu_time": 2.2727305415550787e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5455359905952024e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8917370395018314e+06, - "cpu_time": 2.2724230091152908e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5429335358962238e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time_median", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8908469835527230e+06, - "cpu_time": 2.2725137560320981e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5455359905952024e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3259408153047311e+03, - "cpu_time": 5.5735557721405826e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8130242635704740e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2295264969370387e-03, - "cpu_time": 2.4526928964297464e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2291369217128619e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 363, - "real_time": 1.9358205172866993e+06, - "cpu_time": 2.4725975426997878e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0833401037299819e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 363, - "real_time": 1.9336964479024129e+06, - "cpu_time": 2.4709552837465438e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0845300989588599e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 363, - "real_time": 1.9346150011914594e+06, - "cpu_time": 2.4711756143250829e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0840151651405783e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 363, - "real_time": 1.9350681212132915e+06, - "cpu_time": 2.4727461680440959e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0837613296451194e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 363, - "real_time": 1.9360409165057801e+06, - "cpu_time": 2.4717076088154749e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0832167761128714e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9350482008199287e+06, - "cpu_time": 2.4718364435261972e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0837726947174823e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time_median", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9350681212132915e+06, - "cpu_time": 2.4717076088154754e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0837613296451194e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.4832112773509630e+02, - "cpu_time": 8.1188158329860994e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3121622535461024e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.9007623031471184e-04, - "cpu_time": 3.2845279283139810e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9015464953477863e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 345, - "real_time": 2.0341536794465196e+06, - "cpu_time": 2.8890419478260730e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0619405713442671e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 345, - "real_time": 2.0321436990659845e+06, - "cpu_time": 2.8870881420289152e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0639800236212573e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 345, - "real_time": 2.0309564640637543e+06, - "cpu_time": 2.8865827304348778e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0651865631858940e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 345, - "real_time": 2.0295377798796890e+06, - "cpu_time": 2.8878096956522432e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0666301665242412e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 345, - "real_time": 2.0346197687710326e+06, - "cpu_time": 2.8872689449276486e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0614682233887255e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0322822782453964e+06, - "cpu_time": 2.8875582921739514e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0638411096128774e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time_median", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0321436990659847e+06, - "cpu_time": 2.8872689449276486e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0639800236212573e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1374788372068588e+03, - "cpu_time": 9.3820593411470600e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1708878145496142e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0517627694181764e-03, - "cpu_time": 3.2491324474989572e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0518677065003400e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 337, - "real_time": 2.0814954395784556e+06, - "cpu_time": 3.6496735964392726e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0300871385521078e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 337, - "real_time": 2.0728957831019463e+06, - "cpu_time": 3.6469538338279747e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0468064378263259e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 337, - "real_time": 2.0820409980483728e+06, - "cpu_time": 3.6466020801187572e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0290311323663492e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 337, - "real_time": 2.0748831702048064e+06, - "cpu_time": 3.6465603353115134e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0429302817912307e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 337, - "real_time": 2.0752450142426067e+06, - "cpu_time": 3.6471784094955944e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0422253480568190e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0773120810352378e+06, - "cpu_time": 3.6473936510386220e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0382160677185664e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time_median", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0752450142426069e+06, - "cpu_time": 3.6469538338279747e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0422253480568190e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1695085201062839e+03, - "cpu_time": 1.2998960298874031e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1014679005720932e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0071652007282365e-03, - "cpu_time": 3.5639038564352601e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0061997091574907e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 189, - "real_time": 3.6969183692856440e+06, - "cpu_time": 6.8005900264549712e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5381624164024649e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 189, - "real_time": 3.5593321327632540e+06, - "cpu_time": 6.8502048835977716e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.7135854070957870e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 189, - "real_time": 3.6924239987182240e+06, - "cpu_time": 6.7894136137566883e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5436862087950869e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 189, - "real_time": 3.6963299483494470e+06, - "cpu_time": 6.7970770317460680e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5388848491438570e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 189, - "real_time": 3.6939553960803011e+06, - "cpu_time": 6.7932117407407435e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5418025398472595e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6677919690393740e+06, - "cpu_time": 6.8060994592592493e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5752242842568913e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time_median", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6939553960803011e+06, - "cpu_time": 6.7970770317460671e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5418025398472595e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.0657978329491962e+04, - "cpu_time": 2.5007784952243703e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7378291706475914e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6538009473143267e-02, - "cpu_time": 3.6743196454795063e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6912458690327072e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 95, - "real_time": 7.5076852434952008e+06, - "cpu_time": 1.3941601515789084e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4693445331997890e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 95, - "real_time": 7.5224137178769233e+06, - "cpu_time": 1.3939104821052920e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4605938011968555e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 95, - "real_time": 7.5168810735799763e+06, - "cpu_time": 1.3943381705263093e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4638769286819944e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 95, - "real_time": 7.5229929858132415e+06, - "cpu_time": 1.3942468305263469e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4602503369704714e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 95, - "real_time": 7.5131353775137346e+06, - "cpu_time": 1.3937591136842504e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4661024078477230e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5166216796558155e+06, - "cpu_time": 1.3940829496842215e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4640336015793676e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time_median", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5168810735799763e+06, - "cpu_time": 1.3941601515789086e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4638769286819944e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4463696756315640e+03, - "cpu_time": 2.4112733140080281e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8293543247706918e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.5761528920353248e-04, - "cpu_time": 1.7296483789248077e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5782381284403250e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 48, - "real_time": 1.4701629639603198e+07, - "cpu_time": 2.7085812145833421e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5647227991121731e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 48, - "real_time": 1.4686109730973840e+07, - "cpu_time": 2.7088345874999460e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5695466824998312e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 48, - "real_time": 1.4702882986360541e+07, - "cpu_time": 2.7128969583333883e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5643336794732742e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 48, - "real_time": 1.4692206265560040e+07, - "cpu_time": 2.7051310083333392e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5676505479854107e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 48, - "real_time": 1.4662789568925897e+07, - "cpu_time": 2.7044841937499344e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5768142333720999e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4689123638284704e+07, - "cpu_time": 2.7079855924999900e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5686135884885578e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time_median", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4692206265560042e+07, - "cpu_time": 2.7085812145833425e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5676505479854107e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6261835425504201e+04, - "cpu_time": 3.3765928274303435e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0622265634007333e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1070664136232395e-03, - "cpu_time": 1.2469020650560775e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1080443695557711e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 25, - "real_time": 2.6999604105949402e+07, - "cpu_time": 4.9967930839998186e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9710998529206190e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 25, - "real_time": 2.8340256065130234e+07, - "cpu_time": 5.1083491759998195e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7359391422415934e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 25, - "real_time": 2.8328038081526756e+07, - "cpu_time": 5.1020464680000260e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7379817696420670e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 25, - "real_time": 2.8411948829889297e+07, - "cpu_time": 5.1134010199998558e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7239887979385386e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 25, - "real_time": 2.8396064192056656e+07, - "cpu_time": 5.1183771519999936e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7266313772295694e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8095182254910477e+07, - "cpu_time": 5.0877933799999028e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7791281879944773e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time_median", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8340256065130241e+07, - "cpu_time": 5.1083491759998202e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7359391422415934e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.1348298510445107e+05, - "cpu_time": 5.1229540977157111e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0747989233691667e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1835878462658009e-02, - "cpu_time": 1.0069107990615391e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2489434915538380e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.0316881388425827e+07, - "cpu_time": 9.1693882499998838e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3348985190037441e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.5149123072624207e+07, - "cpu_time": 9.5626295699997857e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8674474052199430e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.5211555957794189e+07, - "cpu_time": 9.5822959800000265e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8619433258718929e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.5132771283388138e+07, - "cpu_time": 9.5681858000000373e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8688910379674921e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.0012272223830223e+07, - "cpu_time": 9.1286271699999586e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3673917233477316e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3164520785212524e+07, - "cpu_time": 9.4022253539999396e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0601144022821608e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time_median", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5132771283388138e+07, - "cpu_time": 9.5626295699997857e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8688910379674921e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7408361127319322e+06, - "cpu_time": 2.3171474693160695e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6593438344171444e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.1553857201216108e-02, - "cpu_time": 2.4644670618645590e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2555014037187667e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 9.5046305097639561e+07, - "cpu_time": 1.8012250099999961e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6485195447469635e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 1.0783355310559273e+08, - "cpu_time": 1.8340230550000313e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.9787000106941252e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 9.4974483363330364e+07, - "cpu_time": 1.7999204125000289e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6527910759584694e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 1.0786197148263454e+08, - "cpu_time": 1.8385654562499100e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.9773882733678255e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 9.5071386545896530e+07, - "cpu_time": 1.8028767475000507e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6470293692500315e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0015753991901875e+08, - "cpu_time": 1.8153221362500036e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.3808856548034830e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time_median", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5071386545896530e+07, - "cpu_time": 1.8028767475000507e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6470293692500315e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0202777180208210e+06, - "cpu_time": 1.9240621422039159e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6774867878493148e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.0092353742883320e-02, - "cpu_time": 1.0599012174106696e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8343522307827628e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.7986493557691574e+08, - "cpu_time": 3.1871025724998957e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9697117759833469e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8023148924112320e+08, - "cpu_time": 3.2264847699997288e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9575706138869638e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.7977836728096008e+08, - "cpu_time": 3.2172579575001234e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9725863586353617e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8014448881149292e+08, - "cpu_time": 3.2239760400000250e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9604478109990177e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8008193373680115e+08, - "cpu_time": 3.2149539849999088e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9625182921976395e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8002024292945862e+08, - "cpu_time": 3.2139550649999368e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9645669703404665e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time_median", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8008193373680115e+08, - "cpu_time": 3.2172579575001234e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9625182921976395e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9137136816232878e+05, - "cpu_time": 1.5735125840236386e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3421836366727827e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0630547156706045e-03, - "cpu_time": 4.8958761158774001e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0633099885054625e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 381, - "real_time": 1.8480922752758183e+06, - "cpu_time": 2.0696343543304799e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2163395490567121e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 381, - "real_time": 1.8468097289929441e+06, - "cpu_time": 2.0657908897638493e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2178787211791049e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 381, - "real_time": 1.8496372757386051e+06, - "cpu_time": 2.0681680813648563e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2144882424930413e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 381, - "real_time": 1.8469693242586611e+06, - "cpu_time": 2.0655158608922868e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2176870759042292e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 381, - "real_time": 1.8425821139140476e+06, - "cpu_time": 2.0657112414698419e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2229674157094685e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8468181436360155e+06, - "cpu_time": 2.0669640855642627e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2178722008685111e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time_median", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8469693242586609e+06, - "cpu_time": 2.0657908897638493e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2176870759042292e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6238231379684366e+03, - "cpu_time": 1.8454879152341225e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1541926029591946e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4207263162374255e-03, - "cpu_time": 8.9284953140843790e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4221705839155311e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 382, - "real_time": 1.8437452347001673e+06, - "cpu_time": 2.0674568848169118e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4431301276459685e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 382, - "real_time": 1.8488204246912582e+06, - "cpu_time": 2.0691145000000093e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4309333078511469e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 382, - "real_time": 1.8504321724417161e+06, - "cpu_time": 2.0700248455498491e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4270739138686405e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 382, - "real_time": 1.8471266099672972e+06, - "cpu_time": 2.0664947905759318e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4349964727891805e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 382, - "real_time": 1.8444091102723349e+06, - "cpu_time": 2.0682013455495902e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4415308699003421e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8469067104145549e+06, - "cpu_time": 2.0682584732984588e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4355329384110561e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time_median", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8471266099672974e+06, - "cpu_time": 2.0682013455495904e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4349964727891805e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8448407606427027e+03, - "cpu_time": 1.3792422794761083e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8317633019926216e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5403272642851315e-03, - "cpu_time": 6.6686166032067199e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5402350510872248e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 381, - "real_time": 1.8451983781369205e+06, - "cpu_time": 2.0705319133859547e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8792620859242082e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 381, - "real_time": 1.8482409171889026e+06, - "cpu_time": 2.0697228871392573e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8646452135251835e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 381, - "real_time": 1.8519730093428167e+06, - "cpu_time": 2.0732410419947365e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8467811989408843e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 381, - "real_time": 1.8498972075101566e+06, - "cpu_time": 2.0716325065616197e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8567083260003496e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 381, - "real_time": 1.8461835754919478e+06, - "cpu_time": 2.0716400577428341e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8745237567364872e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8482986175341487e+06, - "cpu_time": 2.0713536813648802e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8643841162254233e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time_median", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8482409171889026e+06, - "cpu_time": 2.0716325065616197e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8646452135251835e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7452168204448599e+03, - "cpu_time": 1.3282203774022912e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3162588236438578e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4852669338179278e-03, - "cpu_time": 6.4123302039228991e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4848846872898586e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 380, - "real_time": 1.8542003011756795e+06, - "cpu_time": 2.0823200526314466e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7672308638512801e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 380, - "real_time": 1.8534533250395295e+06, - "cpu_time": 2.0768617552631130e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7679430907331396e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 380, - "real_time": 1.8550386246620053e+06, - "cpu_time": 2.0783741473684660e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7664322221846163e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 380, - "real_time": 1.8526423931976559e+06, - "cpu_time": 2.0765228578948395e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7687169483066030e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 380, - "real_time": 1.8486347998412766e+06, - "cpu_time": 2.0763791131580428e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7725512904340789e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8527938887832295e+06, - "cpu_time": 2.0780915852631810e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7685748831019435e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time_median", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8534533250395295e+06, - "cpu_time": 2.0768617552631130e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7679430907331396e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4886071857148677e+03, - "cpu_time": 2.4932772472075467e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3784734045049780e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3431646125242733e-03, - "cpu_time": 1.1997918017130048e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3448530945623968e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 380, - "real_time": 1.8565472606018088e+06, - "cpu_time": 2.0901602921053621e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5299936279971771e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 380, - "real_time": 1.8607350978479523e+06, - "cpu_time": 2.0897776789474010e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5220488975457154e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 380, - "real_time": 1.8586428605263601e+06, - "cpu_time": 2.0877947184209533e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5260135979776382e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 380, - "real_time": 1.8557160926368516e+06, - "cpu_time": 2.0852103684208752e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5315746983083829e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 380, - "real_time": 1.8563409477983920e+06, - "cpu_time": 2.0896819736842525e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5303859497214273e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8575964518822730e+06, - "cpu_time": 2.0885250063157689e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5280033543100677e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time_median", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8565472606018085e+06, - "cpu_time": 2.0896819736842525e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5299936279971771e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0711659329261488e+03, - "cpu_time": 2.0677322486277044e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9308756606352996e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1149708704640715e-03, - "cpu_time": 9.9004428597925030e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1141927220202480e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8557904647631906e+06, - "cpu_time": 2.1024784696570435e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0628663358675867e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8612747898065462e+06, - "cpu_time": 2.1041797044856166e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0420553009060591e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8602599161243960e+06, - "cpu_time": 2.1050623113455730e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0458971278094873e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8628431794876822e+06, - "cpu_time": 2.1055027176781143e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0361263601398438e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8582601454366972e+06, - "cpu_time": 2.1042697941953344e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0534795852922767e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8596856991237025e+06, - "cpu_time": 2.1042985994723365e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0480849420030519e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time_median", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8602599161243960e+06, - "cpu_time": 2.1042697941953344e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0458971278094873e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7399667265774442e+03, - "cpu_time": 1.1576911052460978e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0389207905923338e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4733493556833483e-03, - "cpu_time": 5.5015533704978682e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4740469207470627e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8685159315287187e+06, - "cpu_time": 2.1327632148542753e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4029529830421513e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8715045968532581e+06, - "cpu_time": 2.1331306153846267e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4007125627196860e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8716743537064255e+06, - "cpu_time": 2.1334884482758809e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4005855210917616e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8703638138564487e+06, - "cpu_time": 2.1325571034484990e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4015668933387506e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8701507545178831e+06, - "cpu_time": 2.1318157082228134e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4017265686561167e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8704418900925468e+06, - "cpu_time": 2.1327510180372195e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4015089057696933e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time_median", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8703638138564485e+06, - "cpu_time": 2.1327632148542753e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4015668933387506e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2696933122825419e+03, - "cpu_time": 6.3254517113249381e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5169590416266903e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.7881997243962459e-04, - "cpu_time": 2.9658650530835429e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7905091451417364e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 372, - "real_time": 1.8956940757268439e+06, - "cpu_time": 2.1964512634409764e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7656783165236109e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 372, - "real_time": 1.8968609591504128e+06, - "cpu_time": 2.1973949677419933e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7639769666345179e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 372, - "real_time": 1.8981048476322736e+06, - "cpu_time": 2.1993671075268053e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7621656446112829e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 372, - "real_time": 1.8915448050510378e+06, - "cpu_time": 2.1939706397851082e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7717450762994409e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 372, - "real_time": 1.8917659020786155e+06, - "cpu_time": 2.1941193333333638e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7714211331535691e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8947941179278367e+06, - "cpu_time": 2.1962606623656498e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7669974274444842e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time_median", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8956940757268439e+06, - "cpu_time": 2.1964512634409764e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7656783165236109e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9904353051137341e+03, - "cpu_time": 2.2804863754846997e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3680288554449822e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5782375915247722e-03, - "cpu_time": 1.0383495978242986e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5786168834566509e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 369, - "real_time": 1.9034304827083217e+06, - "cpu_time": 2.2815761165313064e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5088746845538568e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 369, - "real_time": 1.9043441312917606e+06, - "cpu_time": 2.2805841788617615e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5062316876977837e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 369, - "real_time": 1.9019887822700366e+06, - "cpu_time": 2.2801785907861548e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5130503911201692e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 369, - "real_time": 1.9046450360314695e+06, - "cpu_time": 2.2806039186989833e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5053617874374104e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 369, - "real_time": 1.9024787366587096e+06, - "cpu_time": 2.2807110542005086e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5116305890577042e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9033774337920598e+06, - "cpu_time": 2.2807307718157438e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5090298279733849e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time_median", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9034304827083214e+06, - "cpu_time": 2.2806039186989833e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5088746845538568e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1489281162085083e+03, - "cpu_time": 5.1416961215488732e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3255475519078056e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.0362600491670345e-04, - "cpu_time": 2.2544073088712039e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0365393830717014e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 358, - "real_time": 1.9457454382774923e+06, - "cpu_time": 2.4736868463687715e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0778141676418591e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 358, - "real_time": 1.9468292343565498e+06, - "cpu_time": 2.4732928072627126e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0772141505739889e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 358, - "real_time": 1.9515229155915640e+06, - "cpu_time": 2.4783676117317048e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0746233022656009e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 358, - "real_time": 1.9471979506220149e+06, - "cpu_time": 2.4744999329608334e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0770101721450989e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 358, - "real_time": 1.9474227856792635e+06, - "cpu_time": 2.4752015027933489e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0768858285020583e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9477436649053772e+06, - "cpu_time": 2.4750097402234743e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0767095242257211e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time_median", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9471979506220147e+06, - "cpu_time": 2.4744999329608330e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0770101721450989e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2086532201324444e+03, - "cpu_time": 2.0167972338433769e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2194957221409185e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1339547702955784e-03, - "cpu_time": 8.1486436237672173e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1326134808901937e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 346, - "real_time": 2.0338412307975329e+06, - "cpu_time": 2.8966130664740754e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0622573367515428e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 346, - "real_time": 2.0319137717543351e+06, - "cpu_time": 2.8925630346821821e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0642135794860415e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 346, - "real_time": 2.0289297358299782e+06, - "cpu_time": 2.8920062687861924e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0672495089063435e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 346, - "real_time": 2.0272788637777993e+06, - "cpu_time": 2.8918098612719094e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0689329302156222e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 346, - "real_time": 2.0271993324300544e+06, - "cpu_time": 2.8933491098265708e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0690140988613012e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0298325869179401e+06, - "cpu_time": 2.8932682682081861e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0663334908441701e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time_median", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0289297358299785e+06, - "cpu_time": 2.8925630346821821e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0672495089063435e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9441139258828057e+03, - "cpu_time": 1.9628524180991913e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9954502930678050e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4504220421217562e-03, - "cpu_time": 6.7842046991197066e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4496451353765059e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 325, - "real_time": 2.1614762621286972e+06, - "cpu_time": 3.7429450830771974e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.8809623528960743e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 325, - "real_time": 2.1577642213266632e+06, - "cpu_time": 3.7390170307690613e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.8876388425990367e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 325, - "real_time": 2.1456681593106342e+06, - "cpu_time": 3.7325332369230702e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9095551488703237e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 325, - "real_time": 2.1565122726874859e+06, - "cpu_time": 3.7372111815385809e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.8898957850798416e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 325, - "real_time": 2.1481006574602085e+06, - "cpu_time": 3.7329256369230277e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.9051279887033844e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1539043145827381e+06, - "cpu_time": 3.7369264338461882e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.8946360236297321e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time_median", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1565122726874859e+06, - "cpu_time": 3.7372111815385809e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.8898957850798416e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7184708983151386e+03, - "cpu_time": 4.3583933542926043e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2155876194960197e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1192058313958414e-03, - "cpu_time": 1.1663042961771067e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1211841417805035e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 174, - "real_time": 4.0116933731083898e+06, - "cpu_time": 7.1560809137932230e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1820783493730655e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 174, - "real_time": 4.0215958610990611e+06, - "cpu_time": 7.1681443563217996e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1717807008621097e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 174, - "real_time": 4.0156206988526145e+06, - "cpu_time": 7.1570842873561354e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1779882260278625e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 174, - "real_time": 4.0199370243875631e+06, - "cpu_time": 7.1682940574718509e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1735021962330384e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 174, - "real_time": 4.0263931585432985e+06, - "cpu_time": 7.1699990402300674e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1668101795776443e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0190480231981860e+06, - "cpu_time": 7.1639205310346158e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1744319304147449e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time_median", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0199370243875631e+06, - "cpu_time": 7.1681443563217996e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.1735021962330384e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.6362719156484700e+03, - "cpu_time": 6.7474167970603494e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8544741642747046e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4023897905960745e-03, - "cpu_time": 9.4186092207891711e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4024600860345186e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 90, - "real_time": 7.8837633236414855e+06, - "cpu_time": 1.4056749711110367e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2561440041431017e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 90, - "real_time": 7.8676477747244965e+06, - "cpu_time": 1.4069561077777356e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2648619969740553e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 90, - "real_time": 7.9819861592517961e+06, - "cpu_time": 1.4172058533333458e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2037697548632779e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 90, - "real_time": 7.8680405496723121e+06, - "cpu_time": 1.4054622166666932e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2646490937819929e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 90, - "real_time": 7.8749028862350518e+06, - "cpu_time": 1.4061762988887949e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2609327993938212e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8952681387050273e+06, - "cpu_time": 1.4082950895555213e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2500715298312502e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time_median", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8749028862350509e+06, - "cpu_time": 1.4061762988887947e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.2609327993938212e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8916626713908445e+04, - "cpu_time": 5.0143306298083131e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6124508488133512e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.1956890956121075e-03, - "cpu_time": 3.5605681415752924e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1468397189942802e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 46, - "real_time": 1.5262760383927304e+07, - "cpu_time": 2.7323593999999896e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.3969021534708805e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 46, - "real_time": 1.5263143197997756e+07, - "cpu_time": 2.7314231000001084e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.3967918750053692e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 46, - "real_time": 1.5292416245717069e+07, - "cpu_time": 2.7356930934783831e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.3883754484380522e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 46, - "real_time": 1.5032098223657712e+07, - "cpu_time": 2.6056694934783556e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4643710413216429e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 46, - "real_time": 1.5294343192616235e+07, - "cpu_time": 2.7352231913045235e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.3878225533999166e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5228952248783220e+07, - "cpu_time": 2.7080736556522720e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.4068526143271732e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time_median", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5263143197997754e+07, - "cpu_time": 2.7323593999999892e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.3967918750053692e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1109362342198717e+05, - "cpu_time": 5.7274638786231936e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2450533389386375e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.2948960379637072e-03, - "cpu_time": 2.1149586779771929e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3636529807886118e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 23, - "real_time": 3.0112891984374627e+07, - "cpu_time": 5.2410173739130899e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4571517099601278e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 23, - "real_time": 3.0117247334640957e+07, - "cpu_time": 5.2338769260868303e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4565071471728535e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 23, - "real_time": 3.0122561623220857e+07, - "cpu_time": 5.2422950739133224e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4557209203793058e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 23, - "real_time": 3.0092251689537711e+07, - "cpu_time": 5.2379639521736071e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4602088731918983e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 23, - "real_time": 3.0144454668397490e+07, - "cpu_time": 5.2405086347829163e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4524848592039614e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0117881460034333e+07, - "cpu_time": 5.2391323921739534e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4564147019816294e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time_median", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0117247334640957e+07, - "cpu_time": 5.2405086347829171e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.4565071471728535e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8776457646973373e+04, - "cpu_time": 3.3329765778772940e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7781495290498673e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.2343221822853826e-04, - "cpu_time": 6.3616956556699863e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2340462341049872e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.9363515675067902e+07, - "cpu_time": 9.9733661099992335e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.5218928317741175e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.9164601191878319e+07, - "cpu_time": 9.9633707600003153e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.5370956719446096e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.9197128564119339e+07, - "cpu_time": 9.9546580099990934e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.5346026489991703e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.9718941897153854e+07, - "cpu_time": 9.8046241800000191e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.4949801096993876e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.9126920625567436e+07, - "cpu_time": 9.9608335999994323e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.5399870847311497e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9314221590757385e+07, - "cpu_time": 9.9313705319996193e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.5257116694296875e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time_median", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9197128564119339e+07, - "cpu_time": 9.9608335999994323e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.5346026489991703e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4362221027860470e+05, - "cpu_time": 7.1173485084477556e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8516511533361785e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1073153072713857e-03, - "cpu_time": 7.1665320365554043e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0914032722051789e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.1534585431218147e+08, - "cpu_time": 1.8806281975000161e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.6544448016915159e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 1.1593741737306118e+08, - "cpu_time": 1.9259290425000587e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.6306958026541786e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.1553475540131330e+08, - "cpu_time": 1.8814828637499657e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.6468347133740263e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 1.1599481571465731e+08, - "cpu_time": 1.9273312612499183e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.6284043704218760e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.1540485359728336e+08, - "cpu_time": 1.8758924987500337e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.6520652751180124e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1564353927969933e+08, - "cpu_time": 1.8982527727499989e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.6424889926519222e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time_median", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1553475540131330e+08, - "cpu_time": 1.8814828637499660e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.6468347133740263e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0297714211793581e+05, - "cpu_time": 2.5996979414341855e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2155119887691770e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6199227730755036e-03, - "cpu_time": 1.3695214771992686e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6182334318790531e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 2.0591312646865845e+08, - "cpu_time": 3.2382666050000352e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.2145380064608545e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 2.0644620433449745e+08, - "cpu_time": 3.2431641425000632e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.2010732164407063e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 2.0662897452712059e+08, - "cpu_time": 3.2549405199998206e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.1964726943900528e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 2.0605592802166939e+08, - "cpu_time": 3.2415575824998653e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.2109242102808247e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 2.0650283992290497e+08, - "cpu_time": 3.2501045950002092e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.1996467670898228e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0630941465497017e+08, - "cpu_time": 3.2456066889999992e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.2045309789324532e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time_median", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0644620433449745e+08, - "cpu_time": 3.2431641425000632e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.2010732164407063e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0803533176601405e+05, - "cpu_time": 6.7747636396501435e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7743424728886234e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4930745273121406e-03, - "cpu_time": 2.0873643324100708e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4937642804622687e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 382, - "real_time": 1.8465842129072938e+06, - "cpu_time": 2.0683208115184263e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2181495820064377e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 382, - "real_time": 1.8511216136718630e+06, - "cpu_time": 2.0724831780104109e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2127125358745190e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 382, - "real_time": 1.8467932190943854e+06, - "cpu_time": 2.0680959921466508e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2178985484950836e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 382, - "real_time": 1.8412949712143990e+06, - "cpu_time": 2.0684308089007146e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2245213635154520e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 382, - "real_time": 1.8414499327501997e+06, - "cpu_time": 2.0690049214659233e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2243341657856731e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8454487899276279e+06, - "cpu_time": 2.0692671424084255e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2195232391354330e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time_median", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8465842129072933e+06, - "cpu_time": 2.0684308089007144e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2181495820064377e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1389211453164153e+03, - "cpu_time": 1.8288133882577890e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9759043158994054e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2427721472990476e-03, - "cpu_time": 8.8379762611473576e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2418798002032457e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 382, - "real_time": 1.8465305973089384e+06, - "cpu_time": 2.0693080811518996e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4364279757609768e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 382, - "real_time": 1.8515576493930309e+06, - "cpu_time": 2.0737806910992803e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4243828987368904e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 382, - "real_time": 1.8475077786825411e+06, - "cpu_time": 2.0696796701570686e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4340814661368951e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 382, - "real_time": 1.8426901457056585e+06, - "cpu_time": 2.0699525366491647e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4456741786410715e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 382, - "real_time": 1.8423789499319312e+06, - "cpu_time": 2.0701090628271522e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4464250963693773e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8461330242044199e+06, - "cpu_time": 2.0705660083769131e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4373983231290430e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time_median", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8465305973089382e+06, - "cpu_time": 2.0699525366491645e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4364279757609768e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7888342100649861e+03, - "cpu_time": 1.8225880050113374e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1010549659993067e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0523083441929984e-03, - "cpu_time": 8.8023661049088588e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0509889586792095e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 381, - "real_time": 1.8483568434747122e+06, - "cpu_time": 2.0725939737532800e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8640892357126456e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 381, - "real_time": 1.8535680207469699e+06, - "cpu_time": 2.0782530971129788e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8391684667700548e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 381, - "real_time": 1.8483190651750192e+06, - "cpu_time": 2.0722750787401879e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8642704112607222e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 381, - "real_time": 1.8445302544679893e+06, - "cpu_time": 2.0731965459317460e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8824783222249579e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 381, - "real_time": 1.8483438246476762e+06, - "cpu_time": 2.0725053018374669e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8641516700081769e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8486236017024736e+06, - "cpu_time": 2.0737647994751320e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8628316211953126e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time_median", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8483438246476762e+06, - "cpu_time": 2.0725939737532798e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8641516700081769e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2188875762509256e+03, - "cpu_time": 2.5320032983780834e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5421834996148724e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7412347074258489e-03, - "cpu_time": 1.2209693688594440e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7400573152340686e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8511144930889907e+06, - "cpu_time": 2.0782076870025520e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7701768379177563e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8551378677718327e+06, - "cpu_time": 2.0826713660475174e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7663377245032985e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8495802567978092e+06, - "cpu_time": 2.0786585039790205e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7716452086665034e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8444462418665835e+06, - "cpu_time": 2.0785867267904447e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7765765819685109e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8488328803709859e+06, - "cpu_time": 2.0779301644562962e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7723613825725984e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8498223479792406e+06, - "cpu_time": 2.0792108896551661e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7714195471257340e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time_median", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8495802567978096e+06, - "cpu_time": 2.0785867267904449e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7716452086665034e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8686095975724661e+03, - "cpu_time": 1.9568008762149177e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7048020474699457e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0913411505697095e-03, - "cpu_time": 9.4112669664761592e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0914311651812102e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8501916252678209e+06, - "cpu_time": 2.0847361329786996e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5421195893973127e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8559700306371830e+06, - "cpu_time": 2.0913366542555543e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5310915003029704e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8500712571465634e+06, - "cpu_time": 2.0849889707448562e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5423500444560558e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8460308154781740e+06, - "cpu_time": 2.0857780558511431e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5501032512842603e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8501065833527506e+06, - "cpu_time": 2.0850115664891389e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5422824063052684e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8504740623764987e+06, - "cpu_time": 2.0863702760638786e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5415893583491735e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time_median", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8501065833527506e+06, - "cpu_time": 2.0850115664891389e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5422824063052684e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5470119017843012e+03, - "cpu_time": 2.8035761464586894e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7829105155898971e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9168125476068541e-03, - "cpu_time": 1.3437577109983961e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9152165396023179e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8505312777864325e+06, - "cpu_time": 2.0996436223402298e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0829389145362422e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8549917113751746e+06, - "cpu_time": 2.1040223723406252e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0659075831035078e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8470027092955709e+06, - "cpu_time": 2.0994837473404850e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0964703700943455e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8501074259705655e+06, - "cpu_time": 2.0996872446810333e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0845615859976187e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8469418861214046e+06, - "cpu_time": 2.0998097047873535e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0967040698423073e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8499150021098300e+06, - "cpu_time": 2.1005293382979454e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0853165047148049e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time_median", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8501074259705651e+06, - "cpu_time": 2.0996872446810333e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0845615859976187e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2981308239959458e+03, - "cpu_time": 1.9561463443958007e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2619572376372346e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7828553313176143e-03, - "cpu_time": 9.3126351949973814e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7810880245046025e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 380, - "real_time": 1.8593009536025897e+06, - "cpu_time": 2.1291140947366063e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4099062311137345e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 380, - "real_time": 1.8576057919601321e+06, - "cpu_time": 2.1273989052630034e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4111928436839527e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 380, - "real_time": 1.8590386645212821e+06, - "cpu_time": 2.1285741105262595e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4101051527484196e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 380, - "real_time": 1.8578790737879709e+06, - "cpu_time": 2.1279806026316956e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4109852664712074e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 380, - "real_time": 1.8574335843272579e+06, - "cpu_time": 2.1278603473684886e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4113236791448760e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8582516136398464e+06, - "cpu_time": 2.1281856121052108e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4107026346324381e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time_median", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8578790737879705e+06, - "cpu_time": 2.1279806026316956e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4109852664712074e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5813853509059720e+02, - "cpu_time": 6.6703536399066138e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5136877458164970e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6179889138356237e-04, - "cpu_time": 3.1342912958180703e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6173357771559371e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 374, - "real_time": 1.8801808518788374e+06, - "cpu_time": 2.1903311711229249e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7884977100797862e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 374, - "real_time": 1.8738428498668110e+06, - "cpu_time": 2.1858072807487543e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7979293996679890e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 374, - "real_time": 1.8788503462238295e+06, - "cpu_time": 2.1890416363636605e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7904723814418209e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 374, - "real_time": 1.8816713637013715e+06, - "cpu_time": 2.1915268663102123e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7862888818624043e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 374, - "real_time": 1.8834852625025725e+06, - "cpu_time": 2.1915159893049905e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7836055340479940e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8796061348346844e+06, - "cpu_time": 2.1896445887701083e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7893587814199990e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time_median", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8801808518788372e+06, - "cpu_time": 2.1903311711229249e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7884977100797862e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6547835592560705e+03, - "cpu_time": 2.3772351842871863e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4304968608774652e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9444411738832276e-03, - "cpu_time": 1.0856717096825493e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9468620878211023e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8741139823024685e+06, - "cpu_time": 2.2706852765956097e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5950492334076583e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8777918725236112e+06, - "cpu_time": 2.2731451010637912e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5840906297607553e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8734845989650025e+06, - "cpu_time": 2.2699508111703559e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5969288489442647e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8795914437121495e+06, - "cpu_time": 2.2739890797871058e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5787442718354094e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8741803730161802e+06, - "cpu_time": 2.2707517819147245e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5948510351353860e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8758324541038827e+06, - "cpu_time": 2.2717044101063171e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5899328038166940e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time_median", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8741803730161800e+06, - "cpu_time": 2.2707517819147245e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5948510351353860e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7001974196628680e+03, - "cpu_time": 1.7547470473341248e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0409225858728425e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4394662027280036e-03, - "cpu_time": 7.7243634318251880e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4384649812574960e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 367, - "real_time": 1.9180650874523178e+06, - "cpu_time": 2.4724894087191513e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0933685273347816e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 367, - "real_time": 1.9170274531052574e+06, - "cpu_time": 2.4719248583105160e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0939603377108512e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 367, - "real_time": 1.9192116511719204e+06, - "cpu_time": 2.4721809782016124e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0927153337775042e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 367, - "real_time": 1.9185245826926681e+06, - "cpu_time": 2.4719481198911672e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0931066606697457e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 367, - "real_time": 1.9160635699264260e+06, - "cpu_time": 2.4722161144412332e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0945106586836927e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9177784688697183e+06, - "cpu_time": 2.4721518959127362e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0935323036353152e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time_median", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9180650874523178e+06, - "cpu_time": 2.4721809782016124e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0933685273347816e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2447640960998162e+03, - "cpu_time": 2.3019308564146294e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0989895912023983e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.4906563312990126e-04, - "cpu_time": 9.3114458711880251e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4917968747723969e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 349, - "real_time": 2.0130427786413271e+06, - "cpu_time": 2.8910676361029074e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0835642662451925e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 349, - "real_time": 2.0134091186457258e+06, - "cpu_time": 2.8902243925501243e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0831851615041876e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 349, - "real_time": 2.0105927858373583e+06, - "cpu_time": 2.8899593667621571e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0861031779009316e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 349, - "real_time": 2.0120204469712081e+06, - "cpu_time": 2.8910821948426035e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0846229501861618e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 349, - "real_time": 2.0097575225816627e+06, - "cpu_time": 2.8902853123209807e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0869701707159910e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0117645305354570e+06, - "cpu_time": 2.8905237805157551e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0848891453104928e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time_median", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0120204469712086e+06, - "cpu_time": 2.8902853123209807e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0846229501861618e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5656586519223940e+03, - "cpu_time": 5.1784857360161959e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6228267827220501e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.7825144451954020e-04, - "cpu_time": 1.7915388798815562e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7837557280791068e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 342, - "real_time": 2.0459876392358011e+06, - "cpu_time": 3.6549505292396401e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1000286801015267e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 342, - "real_time": 2.0413073470777893e+06, - "cpu_time": 3.6527593128655278e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1094291910567112e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 342, - "real_time": 2.0431291631270438e+06, - "cpu_time": 3.6574717807016037e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1057648979769311e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 342, - "real_time": 2.0479277700147650e+06, - "cpu_time": 3.6541516345030349e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0961444650655427e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 342, - "real_time": 2.0484733014035295e+06, - "cpu_time": 3.6551721783626280e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0950536159062810e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0453650441717855e+06, - "cpu_time": 3.6549010871344870e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1012841700213985e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time_median", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0459876392358008e+06, - "cpu_time": 3.6549505292396396e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.1000286801015267e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0854708364498656e+03, - "cpu_time": 1.7199765002632817e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1893238167153606e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5085184159384331e-03, - "cpu_time": 4.7059454120871328e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5091185004825129e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 189, - "real_time": 3.7035002107066768e+06, - "cpu_time": 6.8695707460319046e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5300972176261024e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 189, - "real_time": 3.7059103170774444e+06, - "cpu_time": 6.8878807671958692e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5271511085111341e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 189, - "real_time": 3.7058799012647890e+06, - "cpu_time": 6.8893471164021138e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5271882648636456e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 189, - "real_time": 3.7128911193499649e+06, - "cpu_time": 6.8993391481482163e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5186393731193695e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 189, - "real_time": 3.7027890769341006e+06, - "cpu_time": 6.8877987619047156e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5309672388607912e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7061941250665956e+06, - "cpu_time": 6.8867873079365641e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5268086405962095e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time_median", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7058799012647890e+06, - "cpu_time": 6.8878807671958702e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5271882648636456e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9962652367073542e+03, - "cpu_time": 1.0755580041612175e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8761411056203041e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0782665726220013e-03, - "cpu_time": 1.5617703234739200e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0771697000600594e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 95, - "real_time": 7.4726483980683908e+06, - "cpu_time": 1.3944482599999661e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4902998525493994e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 95, - "real_time": 7.4799326444534883e+06, - "cpu_time": 1.3947055947368139e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4859270256773300e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 95, - "real_time": 7.7806822318387656e+06, - "cpu_time": 1.3941250221053354e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.3125308295838556e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 95, - "real_time": 7.4766584966135649e+06, - "cpu_time": 1.3945731252631862e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4878914845713434e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 95, - "real_time": 7.4719663807436042e+06, - "cpu_time": 1.3941099736842645e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4907097128374243e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5363776303435620e+06, - "cpu_time": 1.3943923951579133e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4534717810438709e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time_median", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4766584966135649e+06, - "cpu_time": 1.3944482599999661e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.4878914845713434e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3660835790565636e+05, - "cpu_time": 2.6698710934991873e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8812088394919723e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8126527704189467e-02, - "cpu_time": 1.9147200621363308e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7696775071166293e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49, - "real_time": 1.4596219364629716e+07, - "cpu_time": 2.7057142326528411e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5976880946734419e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49, - "real_time": 1.4625724728162192e+07, - "cpu_time": 2.7100937122447841e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5884128990052872e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49, - "real_time": 1.4618100427395226e+07, - "cpu_time": 2.7086246714284986e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5908060580999861e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49, - "real_time": 1.4627439026929894e+07, - "cpu_time": 2.7120765367346060e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5878751486469374e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49, - "real_time": 1.4601695218256542e+07, - "cpu_time": 2.7084106571430068e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5959638930206947e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4613835753074717e+07, - "cpu_time": 2.7089839620407481e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5921492186892700e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time_median", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4618100427395228e+07, - "cpu_time": 2.7086246714284986e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5908060580999861e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4162573588869040e+04, - "cpu_time": 2.3422458380691449e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4514808567037554e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.6912089530561954e-04, - "cpu_time": 8.6462152264078752e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6936764131857513e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 25, - "real_time": 2.8262508660554886e+07, - "cpu_time": 5.1237790079999283e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7489672488742504e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 25, - "real_time": 2.5042227208614349e+07, - "cpu_time": 4.9233317079997502e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.3596561872032709e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 25, - "real_time": 2.8291513621807098e+07, - "cpu_time": 5.1304395080001086e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7440985234718933e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 25, - "real_time": 2.8223506882786751e+07, - "cpu_time": 5.1166709079998329e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7555297985261402e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 25, - "real_time": 2.8248172327876091e+07, - "cpu_time": 5.1222821999999724e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7513774145150681e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7613585740327835e+07, - "cpu_time": 5.0833006663999192e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8719258345181246e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time_median", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8248172327876091e+07, - "cpu_time": 5.1222821999999724e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7513774145150681e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4376435410606305e+06, - "cpu_time": 8.9559710757649131e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7268089909412926e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.2062906808985912e-02, - "cpu_time": 1.7618416976518697e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5969837874410039e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.4906305670738220e+07, - "cpu_time": 9.5782241400002033e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8889731829664888e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.2032082155346870e+07, - "cpu_time": 9.2615387800003648e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.1590373646505184e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.4992497712373734e+07, - "cpu_time": 9.5815661000006005e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8813104908235502e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.5000162869691849e+07, - "cpu_time": 9.6020878100000575e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8806302016956911e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.4992417618632317e+07, - "cpu_time": 9.5991630200001046e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8813176002113018e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4384693205356613e+07, - "cpu_time": 9.5245159700002670e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9382537680695105e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time_median", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4992417618632317e+07, - "cpu_time": 9.5815661000006005e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.8813176002113018e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3157143027291538e+06, - "cpu_time": 1.4738203736602277e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2346934034696193e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4192731910080225e-02, - "cpu_time": 1.5473966113368664e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5002631728913611e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.0720609128475189e+08, - "cpu_time": 1.8399000837499103e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0078396252131624e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 1.0387394763529301e+08, - "cpu_time": 1.7877492612498713e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1684847280954657e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.0741833131760359e+08, - "cpu_time": 1.8435018425000748e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 4.9979450007711878e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 1.0411288961768150e+08, - "cpu_time": 1.7962440137500834e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1566229116440077e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.0735198855400085e+08, - "cpu_time": 1.8430539774999487e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0010336951507883e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0599264968186617e+08, - "cpu_time": 1.8220898357499781e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0663851921749220e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time_median", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0720609128475189e+08, - "cpu_time": 1.8399000837499100e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0078396252131624e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8286065104648801e+06, - "cpu_time": 2.7669729751309012e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7962524156262815e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7252201128600791e-02, - "cpu_time": 1.5185711049159147e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7361989035520185e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 2.0024105906486511e+08, - "cpu_time": 3.1605518474998462e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3622460299322395e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 2.0016381517052650e+08, - "cpu_time": 3.1430412149998689e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3643153388400497e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 2.0056834071874619e+08, - "cpu_time": 3.1479226499999416e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3534960709760828e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.9983509555459023e+08, - "cpu_time": 3.1487899025000840e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3731393928584433e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 2.0072638243436813e+08, - "cpu_time": 3.1603766949999112e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3492810012210693e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0030693858861923e+08, - "cpu_time": 3.1521364619999301e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3604955667655773e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time_median", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0024105906486511e+08, - "cpu_time": 3.1487899025000846e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.3622460299322395e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5061534712040267e+05, - "cpu_time": 7.9120057990826736e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3845689820342846e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7503904237709887e-03, - "cpu_time": 2.5100454547144690e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7506905593239316e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 383, - "real_time": 1.8421500724551568e+06, - "cpu_time": 2.0726039660572810e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2234887706738170e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 383, - "real_time": 1.8388882782861928e+06, - "cpu_time": 2.0693747728461192e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2274327637877981e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 383, - "real_time": 1.8347040155281522e+06, - "cpu_time": 2.0696619712794907e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2325126916021346e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 383, - "real_time": 1.8399075880093807e+06, - "cpu_time": 2.0691840757179037e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2261987649235763e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 383, - "real_time": 1.8438532814259189e+06, - "cpu_time": 2.0737469738903223e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2214348838170106e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8399006471409600e+06, - "cpu_time": 2.0709143519582234e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2262135749608674e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time_median", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8399075880093810e+06, - "cpu_time": 2.0696619712794907e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2261987649235763e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4897403566607813e+03, - "cpu_time": 2.1101634940485119e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2256939855393966e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8967004343867823e-03, - "cpu_time": 1.0189525665574607e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8981530043062811e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 383, - "real_time": 1.8442301836862369e+06, - "cpu_time": 2.0753741253262507e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4419617857169416e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 383, - "real_time": 1.8392634461899821e+06, - "cpu_time": 2.0701933315924972e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4539568363464484e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 383, - "real_time": 1.8374140940443370e+06, - "cpu_time": 2.0737829425585889e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4584397314426647e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 383, - "real_time": 1.8388476525874098e+06, - "cpu_time": 2.0702373315929098e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4549639490107745e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 383, - "real_time": 1.8436713067814100e+06, - "cpu_time": 2.0768846605744101e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4433082892097440e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8406853366578750e+06, - "cpu_time": 2.0732944783289314e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4505261183453146e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time_median", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8392634461899821e+06, - "cpu_time": 2.0737829425585889e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4539568363464484e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0652015233736497e+03, - "cpu_time": 3.0172916140780453e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4083447897903661e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6652501447852700e-03, - "cpu_time": 1.4553126174869152e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6645997782717776e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 383, - "real_time": 1.8473630021408310e+06, - "cpu_time": 2.0796710652739564e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8688579239777308e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 383, - "real_time": 1.8414918382266990e+06, - "cpu_time": 2.0746948851175616e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8971341929906663e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 383, - "real_time": 1.8373890632683565e+06, - "cpu_time": 2.0754014334202693e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9170009376544692e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 383, - "real_time": 1.8424472651560183e+06, - "cpu_time": 2.0749037911228430e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8925204589845371e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 383, - "real_time": 1.8571146959761113e+06, - "cpu_time": 2.0903057467363426e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8222876247223187e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8451611729536031e+06, - "cpu_time": 2.0789953843341947e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8795602276659440e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time_median", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8424472651560181e+06, - "cpu_time": 2.0754014334202693e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.8925204589845371e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5658734831055363e+03, - "cpu_time": 6.6432814575144166e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6308776382878495e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1003862394278666e-03, - "cpu_time": 3.1954286707769433e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0890286739372131e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 382, - "real_time": 1.8490496928013095e+06, - "cpu_time": 2.0860477905760049e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7721535623175435e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 382, - "real_time": 1.8426052712601018e+06, - "cpu_time": 2.0802116570678507e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7783515824629635e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 382, - "real_time": 1.8387970938429565e+06, - "cpu_time": 2.0812491780103273e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7820345762847163e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 382, - "real_time": 1.8426823443172411e+06, - "cpu_time": 2.0799701832460540e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7782772001400679e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 382, - "real_time": 1.8475100154109562e+06, - "cpu_time": 2.0845806675391947e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7736304391676683e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8441288835265129e+06, - "cpu_time": 2.0824118952878867e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7768894720745917e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time_median", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8426823443172411e+06, - "cpu_time": 2.0812491780103273e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7782772001400679e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1378819457939671e+03, - "cpu_time": 2.7421809300212767e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9870349265423734e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2438138585417784e-03, - "cpu_time": 1.3168292671715551e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2438283242723848e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 382, - "real_time": 1.8490090714156546e+06, - "cpu_time": 2.0913382958114964e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5443849904870257e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 382, - "real_time": 1.8442446537832706e+06, - "cpu_time": 2.0867850680626852e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5535415469720848e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 382, - "real_time": 1.8490266731189911e+06, - "cpu_time": 2.0968170575916104e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5443512499174498e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 382, - "real_time": 1.8467041306694085e+06, - "cpu_time": 2.0898198429320457e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5488088704411991e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 382, - "real_time": 1.8481089780320467e+06, - "cpu_time": 2.0910105863874084e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5461112293164559e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8474187014038744e+06, - "cpu_time": 2.0911541701570493e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5474395774268433e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time_median", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8481089780320465e+06, - "cpu_time": 2.0910105863874082e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5461112293164559e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0110023162121311e+03, - "cpu_time": 3.6397903410918798e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8646401049289183e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0885471250691287e-03, - "cpu_time": 1.7405652787515543e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0894167527251185e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 383, - "real_time": 1.8476445676425141e+06, - "cpu_time": 2.1036261749345884e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0940051076620311e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 383, - "real_time": 1.8416928011448642e+06, - "cpu_time": 2.0975615796344471e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1169306802155510e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 383, - "real_time": 1.8494914593746490e+06, - "cpu_time": 2.1029704804178430e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0869210742026418e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 383, - "real_time": 1.8409780144123677e+06, - "cpu_time": 2.0982375770234512e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1196939330010206e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 383, - "real_time": 1.8483944312917364e+06, - "cpu_time": 2.1027481540467693e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0911271848185197e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8456402547732263e+06, - "cpu_time": 2.1010287932114201e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1017355959799528e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time_median", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8476445676425141e+06, - "cpu_time": 2.1027481540467693e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.0940051076620311e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9922866438279293e+03, - "cpu_time": 2.8846663801736222e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5371738239379437e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1630903603792827e-03, - "cpu_time": 1.3729780331874527e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1645044414327179e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 381, - "real_time": 1.8437174088511069e+06, - "cpu_time": 2.1220168188973828e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4218230990363771e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 381, - "real_time": 1.8506196888653792e+06, - "cpu_time": 2.1262741758530764e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4165201071686497e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 381, - "real_time": 1.8494744966780704e+06, - "cpu_time": 2.1247885800524573e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4173972145647284e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 381, - "real_time": 1.8511147997534547e+06, - "cpu_time": 2.1261485905512171e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4161412357294872e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 381, - "real_time": 1.8506726036777140e+06, - "cpu_time": 2.1259719553803774e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4164796057339334e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8491197995651450e+06, - "cpu_time": 2.1250400241469024e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4176722524466354e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time_median", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8506196888653792e+06, - "cpu_time": 2.1259719553803774e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4165201071686497e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0802812268848470e+03, - "cpu_time": 1.7904985228232515e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3663806940135392e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6658094449095362e-03, - "cpu_time": 8.4257167040514814e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6692015308401584e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 377, - "real_time": 1.8709263801685872e+06, - "cpu_time": 2.1862395331563847e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8022909161864346e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 377, - "real_time": 1.8763027216594380e+06, - "cpu_time": 2.1917145809018970e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7942612561810374e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 377, - "real_time": 1.8762896063308965e+06, - "cpu_time": 2.1884845145890196e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7942807881628174e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 377, - "real_time": 1.8757027482789315e+06, - "cpu_time": 2.1878163633952779e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7951550451214367e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 377, - "real_time": 1.8757544488019855e+06, - "cpu_time": 2.1884645570290061e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7950780035993218e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8749951810479679e+06, - "cpu_time": 2.1885439098143172e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7962132018502098e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time_median", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8757544488019857e+06, - "cpu_time": 2.1884645570290061e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7950780035993218e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2922411942881054e+03, - "cpu_time": 1.9938941407494913e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4238610091532627e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2225317789920564e-03, - "cpu_time": 9.1105969215790573e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2244635018845303e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 379, - "real_time": 1.8740940875451188e+06, - "cpu_time": 2.2680971398416646e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5951086285829592e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 379, - "real_time": 1.8682057206275675e+06, - "cpu_time": 2.2638783773087524e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6127437595457232e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 379, - "real_time": 1.8778234649735866e+06, - "cpu_time": 2.2703807651714310e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5839966831746316e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 379, - "real_time": 1.8769200396875171e+06, - "cpu_time": 2.2739890923481886e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5866844502047849e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 379, - "real_time": 1.8742114155292807e+06, - "cpu_time": 2.2688146596304448e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5947583677686667e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8742509456726140e+06, - "cpu_time": 2.2690320068600965e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5946583778553522e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time_median", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8742114155292804e+06, - "cpu_time": 2.2688146596304448e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.5947583677686667e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7569226092862182e+03, - "cpu_time": 3.6699100542305432e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1231084211953892e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0044928444402990e-03, - "cpu_time": 1.6173901659981393e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0074655954702278e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 366, - "real_time": 1.9187165077208271e+06, - "cpu_time": 2.4691100874318806e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0929973195941956e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 366, - "real_time": 1.9166553033581972e+06, - "cpu_time": 2.4675474262295594e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0941727478725843e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 366, - "real_time": 1.9170295121402689e+06, - "cpu_time": 2.4675742814207179e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0939591627145236e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 366, - "real_time": 1.9181075183384607e+06, - "cpu_time": 2.4680288797812765e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0933443406846318e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 366, - "real_time": 1.9187868733081173e+06, - "cpu_time": 2.4694711748633790e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0929572372904394e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9178591429731746e+06, - "cpu_time": 2.4683463699453631e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0934861616312749e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time_median", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9181075183384609e+06, - "cpu_time": 2.4680288797812765e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0933443406846318e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7403353919259848e+02, - "cpu_time": 8.9214380256776440e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5542131957640953e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.0787543118656581e-04, - "cpu_time": 3.6143379771596320e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0793630414839978e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 348, - "real_time": 2.0160473847692171e+06, - "cpu_time": 2.8773849885059744e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0804590366709733e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 348, - "real_time": 2.0210032820321575e+06, - "cpu_time": 2.8825611379309664e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0753573422120061e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 348, - "real_time": 2.0142905912549372e+06, - "cpu_time": 2.8765861321839262e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0822735399795899e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 348, - "real_time": 2.0140643588176274e+06, - "cpu_time": 2.8780579425287396e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0825074341031978e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 348, - "real_time": 2.0120837080062251e+06, - "cpu_time": 2.8772296091952692e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0845574084768763e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0154978649760329e+06, - "cpu_time": 2.8783639620689759e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0810309522885289e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time_median", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0142905912549377e+06, - "cpu_time": 2.8773849885059744e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0822735399795899e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3830646802996648e+03, - "cpu_time": 2.4039424880061338e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4884400072009265e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6785255589143947e-03, - "cpu_time": 8.3517669053852868e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6763037586560916e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 337, - "real_time": 2.0696820773444076e+06, - "cpu_time": 3.6234149169139820e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0530901300374384e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 337, - "real_time": 2.0703424997379016e+06, - "cpu_time": 3.6245914243321349e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0517972273002996e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 337, - "real_time": 2.0670214165637726e+06, - "cpu_time": 3.6241811869435189e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0583072496390800e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 337, - "real_time": 2.0727762259482141e+06, - "cpu_time": 3.6242709999997290e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0470398564912806e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 337, - "real_time": 2.0653036829272080e+06, - "cpu_time": 3.6237895964393276e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0616825841856875e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0690251805043011e+06, - "cpu_time": 3.6240496249257391e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0543834095307574e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time_median", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0696820773444078e+06, - "cpu_time": 3.6241811869435189e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0530901300374384e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9198373022969940e+03, - "cpu_time": 4.5561254521534954e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7219566900003711e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4112140005881019e-03, - "cpu_time": 1.2571917947306962e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4113013279774182e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 192, - "real_time": 3.6500133173831273e+06, - "cpu_time": 6.6844505572915366e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5964807635355167e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 192, - "real_time": 3.6519199711619876e+06, - "cpu_time": 6.6911448385417545e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5940809580944166e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 192, - "real_time": 3.6467450033039008e+06, - "cpu_time": 6.6815051822916390e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6006002571608582e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 192, - "real_time": 3.6581350298850643e+06, - "cpu_time": 6.6960100052083274e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5862757560721121e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 192, - "real_time": 3.6469682975924420e+06, - "cpu_time": 6.6835944166664751e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6003185744925547e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6507563238653047e+06, - "cpu_time": 6.6873409999999478e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5955512618710918e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time_median", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6500133173831268e+06, - "cpu_time": 6.6844505572915366e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.5964807635355167e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6580916660305502e+03, - "cpu_time": 6.0429536022811353e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8583358864715155e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2759251105257858e-03, - "cpu_time": 9.0364071493904421e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2747841450660431e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 97, - "real_time": 7.4139026800151337e+06, - "cpu_time": 1.3824893556700997e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5258797489275255e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 97, - "real_time": 7.4109567050850885e+06, - "cpu_time": 1.3827419412370883e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5276788591918707e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 97, - "real_time": 7.4135843357167291e+06, - "cpu_time": 1.3798558670102756e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5260740932484493e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 97, - "real_time": 7.4144865856649950e+06, - "cpu_time": 1.3862988835052015e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5255233268441544e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 97, - "real_time": 7.4151035340637276e+06, - "cpu_time": 1.3817825010308757e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5251467961110229e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4136067681091353e+06, - "cpu_time": 1.3826337096907083e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5260605648646040e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time_median", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4139026800151337e+06, - "cpu_time": 1.3824893556700995e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5258797489275255e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5910129055633038e+03, - "cpu_time": 2.3402466418205997e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7151325425853045e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1460713460111087e-04, - "cpu_time": 1.6926005965412973e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1464875255985290e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49, - "real_time": 1.4598022633213170e+07, - "cpu_time": 2.6711362836733442e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5971201501849346e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49, - "real_time": 1.4579789047794683e+07, - "cpu_time": 2.6738295612246048e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6028693405650330e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49, - "real_time": 1.4619260209099371e+07, - "cpu_time": 2.6772824081634250e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5904418582159081e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49, - "real_time": 1.4571795582163090e+07, - "cpu_time": 2.6728643653061170e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6053942783925686e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49, - "real_time": 1.4586992181685505e+07, - "cpu_time": 2.6735653918366350e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6005964193397999e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4591171930791164e+07, - "cpu_time": 2.6737356020408254e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.5992844093396482e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time_median", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4586992181685507e+07, - "cpu_time": 2.6735653918366350e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6005964193397999e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8428013431421845e+04, - "cpu_time": 2.2434985474255573e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8047034823287912e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2629563628493712e-03, - "cpu_time": 8.3908765912124063e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2620883958690029e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 25, - "real_time": 2.8088959902524948e+07, - "cpu_time": 5.0339473200001515e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7783089322554455e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 25, - "real_time": 2.8152569979429245e+07, - "cpu_time": 5.0403958599999897e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7675124543894691e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 25, - "real_time": 2.8096582219004631e+07, - "cpu_time": 5.0317505599996366e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7770126257283573e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 25, - "real_time": 2.8130265772342682e+07, - "cpu_time": 5.0390466840003684e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7712925674510031e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 25, - "real_time": 2.8115712553262711e+07, - "cpu_time": 5.0310343319997624e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7737622777916965e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8116818085312851e+07, - "cpu_time": 5.0352349511999816e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7735777715231953e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time_median", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8115712553262711e+07, - "cpu_time": 5.0339473200001523e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7737622777916965e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5718811465242183e+04, - "cpu_time": 4.2605300256099385e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3653859331060294e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.1471273126302684e-04, - "cpu_time": 8.4614324195429681e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1448932897831127e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.4613450169563293e+07, - "cpu_time": 9.4311862099993959e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9151894847617989e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.4540522024035454e+07, - "cpu_time": 9.4188465599995643e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9217617660810661e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.4544457793235779e+07, - "cpu_time": 9.4104660300001800e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9214066260878572e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 4.9170000478625298e+07, - "cpu_time": 9.1761324000003695e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.4593340123454266e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.4541722312569618e+07, - "cpu_time": 9.4207825800003782e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9216534538759279e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3482030555605888e+07, - "cpu_time": 9.3714827559999779e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0278690686304150e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time_median", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4541722312569618e+07, - "cpu_time": 9.4188465599995643e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9216534538759279e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4106957590811700e+06, - "cpu_time": 1.0945291480371244e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4121227913393396e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5074873448844498e-02, - "cpu_time": 1.1679359355768599e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7975051824418309e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.0172288864850998e+08, - "cpu_time": 1.7617778375000626e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.2777788670068798e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 1.0673330724239349e+08, - "cpu_time": 1.8159297537499696e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0300222664398031e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.0171758383512497e+08, - "cpu_time": 1.7591166687500960e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.2780541156995955e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 1.0687513183802366e+08, - "cpu_time": 1.8188923112499821e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0233473659116831e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.0180090554058552e+08, - "cpu_time": 1.7678046224999377e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.2737341495057993e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0376996342092752e+08, - "cpu_time": 1.7847042387500098e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1765873529127522e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time_median", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0180090554058552e+08, - "cpu_time": 1.7678046224999377e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.2737341495057993e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7705344036383042e+06, - "cpu_time": 3.0040796138109593e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3687270066773024e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6698808714040307e-02, - "cpu_time": 1.6832366666619164e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6440720756062384e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.8560825288295746e+08, - "cpu_time": 3.1317242525000209e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7849896614084826e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8542753159999847e+08, - "cpu_time": 3.1282622100002301e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7906278249783316e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.8527872487902641e+08, - "cpu_time": 3.1191100350000054e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7952785712502909e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8555964156985283e+08, - "cpu_time": 3.1290797925001359e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7865051630626059e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8527125194668770e+08, - "cpu_time": 3.1231620375001514e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7955123243241863e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8542908057570460e+08, - "cpu_time": 3.1262676655001086e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7905827090047798e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time_median", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8542753159999847e+08, - "cpu_time": 3.1282622100002301e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7906278249783316e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5545738954361441e+05, - "cpu_time": 5.0630328698259249e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8544522649790263e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.3836574641347203e-04, - "cpu_time": 1.6195135578757271e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.3833570970845439e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 384, - "real_time": 1.8392240839564996e+06, - "cpu_time": 2.0731707968749311e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2270260789477988e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 384, - "real_time": 1.8353011443916026e+06, - "cpu_time": 2.0687297552080725e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2317863270105533e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 384, - "real_time": 1.8312123837252632e+06, - "cpu_time": 2.0692872630207285e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2367694956646399e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 384, - "real_time": 1.8339949891128528e+06, - "cpu_time": 2.0673252968750333e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2333757858200767e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 384, - "real_time": 1.8417149730301693e+06, - "cpu_time": 2.0753482421875801e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2240140629691798e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8362895148432776e+06, - "cpu_time": 2.0707722708332692e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2305943500824496e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time_median", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8353011443916026e+06, - "cpu_time": 2.0692872630207285e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.2317863270105533e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1852800767488798e+03, - "cpu_time": 3.3522823851744602e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0823802028785021e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2792049090941320e-03, - "cpu_time": 1.6188561303390047e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2784869883179979e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 384, - "real_time": 1.8353736700191803e+06, - "cpu_time": 2.0694872708334106e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4633962739121076e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 384, - "real_time": 1.8286399621464016e+06, - "cpu_time": 2.0680846145832988e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4798320990341259e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 384, - "real_time": 1.8302132919908825e+06, - "cpu_time": 2.0696319713543095e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4759810432197489e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 384, - "real_time": 1.8339162383161541e+06, - "cpu_time": 2.0676207760415012e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4669433798795762e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 384, - "real_time": 1.8386333635286670e+06, - "cpu_time": 2.0728169088541174e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4554831661914820e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8333553052002571e+06, - "cpu_time": 2.0695283083333275e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4683271924474081e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time_median", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8339162383161546e+06, - "cpu_time": 2.0694872708334110e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.4669433798795762e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0110176184860552e+03, - "cpu_time": 2.0341002048977200e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7742290294486756e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1878015718551250e-03, - "cpu_time": 9.8288107328952691e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1874470262539347e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 384, - "real_time": 1.8346516044213483e+06, - "cpu_time": 2.0704578723957923e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9303058741594367e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 384, - "real_time": 1.8307999760433326e+06, - "cpu_time": 2.0714236640625808e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9490934096517656e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 384, - "real_time": 1.8309274576608913e+06, - "cpu_time": 2.0712248281249402e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9484703129262384e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 384, - "real_time": 1.8353020432944808e+06, - "cpu_time": 2.0707376406251162e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9271409356629420e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 384, - "real_time": 1.8401604312051253e+06, - "cpu_time": 2.0756572369794075e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9035715159194469e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8343683025250356e+06, - "cpu_time": 2.0719002484375674e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9317164096639659e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time_median", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8346516044213485e+06, - "cpu_time": 2.0712248281249399e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.9303058741594367e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8429563390148032e+03, - "cpu_time": 2.1348532584980621e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8693000158920619e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0949753295043945e-03, - "cpu_time": 1.0303841896384578e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0928788265931852e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 384, - "real_time": 1.8379525645097299e+06, - "cpu_time": 2.0765343749999944e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7828534116026439e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 384, - "real_time": 1.8319450124219356e+06, - "cpu_time": 2.0765649296876632e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7886999761351377e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 384, - "real_time": 1.8336800533613011e+06, - "cpu_time": 2.0770974895834017e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7870074956606142e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 384, - "real_time": 1.8375908928192074e+06, - "cpu_time": 2.0763819817706991e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7832043099499568e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 384, - "real_time": 1.8425534165089631e+06, - "cpu_time": 2.0813165781250475e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7784016303898890e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8367443879242279e+06, - "cpu_time": 2.0775790708333612e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7840333647476483e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time_median", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8375908928192076e+06, - "cpu_time": 2.0765649296876632e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.7832043099499568e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1335585703741262e+03, - "cpu_time": 2.1067614439621802e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0130652152531737e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2504811216794364e-03, - "cpu_time": 1.0140463357272429e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2494339481262011e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 383, - "real_time": 1.8386862199089683e+06, - "cpu_time": 2.0829171801564700e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5642840681780182e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 383, - "real_time": 1.8343728774074614e+06, - "cpu_time": 2.0835201409919818e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5726651220782720e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 383, - "real_time": 1.8353993087733716e+06, - "cpu_time": 2.0850296631853385e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5706671396644913e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 383, - "real_time": 1.8392639762900376e+06, - "cpu_time": 2.0832539765013510e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5631644421260320e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 383, - "real_time": 1.8457254157346911e+06, - "cpu_time": 2.0896987075719382e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5506906629398823e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8386895596229057e+06, - "cpu_time": 2.0848839336814159e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5642942869973391e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time_median", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8386862199089683e+06, - "cpu_time": 2.0835201409919816e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.5642840681780182e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4523233509777619e+03, - "cpu_time": 2.8101643653205456e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6171249909337508e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4214655093222383e-03, - "cpu_time": 1.3478756874290144e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4176244431806044e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 383, - "real_time": 1.8460500051705751e+06, - "cpu_time": 2.1031980339425984e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1001326959119365e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 383, - "real_time": 1.8409099172622659e+06, - "cpu_time": 2.0984541462141052e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1199572977979004e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 383, - "real_time": 1.8457955987859573e+06, - "cpu_time": 2.1029335953000896e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1011113086525142e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 383, - "real_time": 1.8367323625572002e+06, - "cpu_time": 2.0976406892951760e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1361512799564511e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 383, - "real_time": 1.8449120524287096e+06, - "cpu_time": 2.1023949582244596e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1045121000457466e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8428799872409417e+06, - "cpu_time": 2.1009242845952855e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1123729364729106e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time_median", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8449120524287098e+06, - "cpu_time": 2.1023949582244596e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 7.1045121000457466e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0110334782123814e+03, - "cpu_time": 2.6577118089620135e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5503004990565538e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1765028140641319e-03, - "cpu_time": 1.2650202715296737e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1797232975600427e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 381, - "real_time": 1.8497281179982151e+06, - "cpu_time": 2.1260759317586059e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4172028713262656e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 381, - "real_time": 1.8496760646516231e+06, - "cpu_time": 2.1262214304460655e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4172427540677154e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 381, - "real_time": 1.8495215221660777e+06, - "cpu_time": 2.1259530000000405e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4173611761651117e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 381, - "real_time": 1.8495080862796237e+06, - "cpu_time": 2.1261073569555297e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4173714726888031e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 381, - "real_time": 1.8482024730149573e+06, - "cpu_time": 2.1244876482940651e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4183727369023952e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8493272528220997e+06, - "cpu_time": 2.1257690734908609e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4175102022300583e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time_median", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8495215221660777e+06, - "cpu_time": 2.1260759317586059e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.4173611761651117e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3599007668374281e+02, - "cpu_time": 7.2268665647704006e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8769906653591206e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.4390347933996697e-04, - "cpu_time": 3.3996479932331977e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4405330259256909e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 376, - "real_time": 1.8745907105535190e+06, - "cpu_time": 2.1887260797869693e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7968131765957117e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 376, - "real_time": 1.8736316541957848e+06, - "cpu_time": 2.1878461861703917e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.7982447821369624e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 376, - "real_time": 1.8712703040751449e+06, - "cpu_time": 2.1884626835105671e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8017758784406275e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 376, - "real_time": 1.8690281815113539e+06, - "cpu_time": 2.1853959494680637e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8051369432859194e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 376, - "real_time": 1.8693422704366620e+06, - "cpu_time": 2.1850824069150453e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8046656211199403e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8715726241544927e+06, - "cpu_time": 2.1871026611702074e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8013272803158325e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time_median", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8712703040751449e+06, - "cpu_time": 2.1878461861703913e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.8017758784406275e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4944194578583838e+03, - "cpu_time": 1.7343781513876831e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7329016515306162e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3327933020954878e-03, - "cpu_time": 7.9300262497038231e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3325474955249621e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 378, - "real_time": 1.8632101904749922e+06, - "cpu_time": 2.2627333994709835e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6277923197311652e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 378, - "real_time": 1.8698438682818846e+06, - "cpu_time": 2.2691242804231602e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6078265024527919e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 378, - "real_time": 1.8631861151396863e+06, - "cpu_time": 2.2631281613758132e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6278650397809899e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 378, - "real_time": 1.8710337567547206e+06, - "cpu_time": 2.2690301375661041e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6042601915357149e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 378, - "real_time": 1.8654701076066070e+06, - "cpu_time": 2.2637098862432856e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6209745507276988e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8665488076515782e+06, - "cpu_time": 2.2655451730158692e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6177437208456731e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time_median", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8654701076066073e+06, - "cpu_time": 2.2637098862432856e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.6209745507276988e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6942472974828715e+03, - "cpu_time": 3.2431189085995284e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1113173281470959e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9791860155700053e-03, - "cpu_time": 1.4314960245450869e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9782271733460323e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 367, - "real_time": 1.9078657352390930e+06, - "cpu_time": 2.4622459073568876e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0992136193153999e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 367, - "real_time": 1.9099740909440417e+06, - "cpu_time": 2.4634630953678596e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0980002346332572e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 367, - "real_time": 1.9108743326895812e+06, - "cpu_time": 2.4629891825613142e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0974829501468213e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 367, - "real_time": 1.9102726864110809e+06, - "cpu_time": 2.4636167929158215e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0978286057892697e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 367, - "real_time": 1.9087389648234730e+06, - "cpu_time": 2.4617291580382055e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0987107397338388e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9095451620214540e+06, - "cpu_time": 2.4628088272480173e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0982472299237173e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time_median", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9099740909440417e+06, - "cpu_time": 2.4629891825613142e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.0980002346332572e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2196715402702569e+03, - "cpu_time": 8.0560035590864686e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0162778918740095e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.3872358953747201e-04, - "cpu_time": 3.2710632956795016e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3886142397658041e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 351, - "real_time": 2.0102136735233911e+06, - "cpu_time": 2.8781618091170588e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0864966024474685e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 351, - "real_time": 2.0082120278165636e+06, - "cpu_time": 2.8730055270656822e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0885762767591197e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 351, - "real_time": 2.0067569964891695e+06, - "cpu_time": 2.8723533903134754e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0900906324671862e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 351, - "real_time": 2.0073445887302191e+06, - "cpu_time": 2.8741099059827859e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0894788187080429e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 351, - "real_time": 2.0070774304916675e+06, - "cpu_time": 2.8731373675216213e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0897569452378001e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0079209434102022e+06, - "cpu_time": 2.8741536000001249e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0888798551239235e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time_median", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0073445887302191e+06, - "cpu_time": 2.8731373675216213e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.0894788187080429e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3910259432335852e+03, - "cpu_time": 2.3269725137690302e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4462087818292351e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.9276927849116501e-04, - "cpu_time": 8.0962009607591235e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9233698543348643e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 339, - "real_time": 2.0649731907839708e+06, - "cpu_time": 3.6208482064896743e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0623326430767121e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 339, - "real_time": 2.0649514870531305e+06, - "cpu_time": 3.6227892802360379e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0623753403385224e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 339, - "real_time": 2.0608287617141125e+06, - "cpu_time": 3.6214728584070429e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0705021959333982e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 339, - "real_time": 2.0693932745089221e+06, - "cpu_time": 3.6234743746312754e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0536557759861574e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 339, - "real_time": 2.0633495871560059e+06, - "cpu_time": 3.6224496519174604e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0655292017492490e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0646992602432284e+06, - "cpu_time": 3.6222068743362986e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0628790314168077e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time_median", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0649514870531305e+06, - "cpu_time": 3.6224496519174604e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.0623753403385224e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1214901303798465e+03, - "cpu_time": 1.0475509876262365e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1391515236032410e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5118376755809582e-03, - "cpu_time": 2.8920241829594027e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5110347800491601e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 192, - "real_time": 3.6381991036857166e+06, - "cpu_time": 6.6759996458335044e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6114067762271891e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 192, - "real_time": 3.6357265998958610e+06, - "cpu_time": 6.6752971302085714e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6145427988123627e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 192, - "real_time": 3.6399115548798968e+06, - "cpu_time": 6.6772452135417387e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6092372704791126e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 192, - "real_time": 3.6382440885063261e+06, - "cpu_time": 6.6725962291661985e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6113497588029757e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 192, - "real_time": 3.6385982760596867e+06, - "cpu_time": 6.6792597708330937e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6109008819100513e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6381359246054976e+06, - "cpu_time": 6.6760795979166217e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6114874972463379e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time_median", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6382440885063261e+06, - "cpu_time": 6.6759996458335053e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 4.6113497588029757e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5155170987029474e+03, - "cpu_time": 2.4609279476111342e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9214573562377074e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1656417740007420e-04, - "cpu_time": 3.6861872473466402e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1666758445839202e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 96, - "real_time": 7.3817636924407752e+06, - "cpu_time": 1.3777454218749577e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5455846865378656e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 96, - "real_time": 7.3868886926599471e+06, - "cpu_time": 1.3756473593749283e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5424309741314611e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 96, - "real_time": 7.3819803074002266e+06, - "cpu_time": 1.3755504177083822e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5454513020527334e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 96, - "real_time": 7.3958270368166268e+06, - "cpu_time": 1.3817279052084075e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5369411470772820e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 96, - "real_time": 7.3892036501395823e+06, - "cpu_time": 1.3808806906250007e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5410078797011032e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3871326758914320e+06, - "cpu_time": 1.3783103589583356e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5422831979000893e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time_median", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3868886926599471e+06, - "cpu_time": 1.3777454218749579e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.5424309741314611e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.8162113617005243e+03, - "cpu_time": 2.8859237532946678e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5749997369734170e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.8734356304202427e-04, - "cpu_time": 2.0938127139055371e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8704906348114748e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52, - "real_time": 1.4487662943653189e+07, - "cpu_time": 2.6575477884613555e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6321386866195221e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52, - "real_time": 1.4534653952488532e+07, - "cpu_time": 2.6659296750000734e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6171628316276522e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52, - "real_time": 1.4473770673458394e+07, - "cpu_time": 2.6542975788458988e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6365847237763968e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52, - "real_time": 1.4485672223739900e+07, - "cpu_time": 2.6572343769229379e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6327752667230988e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52, - "real_time": 1.4505435354434527e+07, - "cpu_time": 2.6578438269229293e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6264632780900173e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4497439029554909e+07, - "cpu_time": 2.6585706492306393e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6290249573673372e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time_median", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4487662943653191e+07, - "cpu_time": 2.6575477884613559e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6321386866195221e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3680753552916212e+04, - "cpu_time": 4.3524283246113118e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5528541967762094e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6334439141037205e-03, - "cpu_time": 1.6371309620343757e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6316296123561494e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 25, - "real_time": 2.8028325513005257e+07, - "cpu_time": 5.0096969760006689e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7886459695111799e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 25, - "real_time": 2.8012460097670555e+07, - "cpu_time": 5.0064701999999665e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7913581146398926e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 25, - "real_time": 2.8027845397591591e+07, - "cpu_time": 5.0079308160002261e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7887279987470322e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 25, - "real_time": 2.7254094928503036e+07, - "cpu_time": 4.8781048399996512e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9246811663384809e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 25, - "real_time": 2.8017516061663628e+07, - "cpu_time": 5.0031099320003703e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7904934793148966e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7868048399686813e+07, - "cpu_time": 4.9810625528001770e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.8167813457102966e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time_median", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8017516061663628e+07, - "cpu_time": 5.0064701999999672e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.7904934793148966e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4327759133939643e+05, - "cpu_time": 5.7605902150586655e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0329001232821353e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2317963081449732e-02, - "cpu_time": 1.1564982679890791e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2524753959726413e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.4460106790065765e+07, - "cpu_time": 9.3962407300000459e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9290291889212036e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.4425880685448647e+07, - "cpu_time": 9.3926933800003096e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9321288442057152e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.3398819267749786e+07, - "cpu_time": 9.1091311800005317e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.0269923507863321e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.4418105259537697e+07, - "cpu_time": 9.3857332199991107e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9328335619137001e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.4504762962460518e+07, - "cpu_time": 9.3988104699997157e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9249907973158531e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4241534993052483e+07, - "cpu_time": 9.3365217959999427e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9491949486285610e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time_median", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4425880685448647e+07, - "cpu_time": 9.3926933800003096e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 4.9321288442057152e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7233271676589752e+05, - "cpu_time": 1.2721019351095692e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3600118931155220e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7079526201903432e-03, - "cpu_time": 1.3625009001259732e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8095375881762274e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 1.0650852415710688e+08, - "cpu_time": 1.8097749162501487e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0406379794360981e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 9.9188854917883873e+07, - "cpu_time": 1.7336862999999881e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4126132663237505e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 1.0663040727376938e+08, - "cpu_time": 1.8130245399999014e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0348763146107569e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 9.9353916011750698e+07, - "cpu_time": 1.7308065449998367e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4036210503922529e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 1.0659786686301231e+08, - "cpu_time": 1.8124795037499553e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0364132772931242e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0365591384470463e+08, - "cpu_time": 1.7799543609999660e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.1856323776111975e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time_median", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0650852415710688e+08, - "cpu_time": 1.8097749162501484e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.0406379794360981e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0031826440448249e+06, - "cpu_time": 4.3580467103129514e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0313572509215173e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8619915599242306e-02, - "cpu_time": 2.4484036252843198e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9172797124837413e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.9507104530930519e+08, - "cpu_time": 3.1270679149997705e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.5043628965922232e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.9528680667281151e+08, - "cpu_time": 3.1206743174999475e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.4982814368969345e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.9541329517960548e+08, - "cpu_time": 3.1276148174998754e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.4947224702040758e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.9522952660918236e+08, - "cpu_time": 3.1263332399998945e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.4998946247995358e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.9538485631346703e+08, - "cpu_time": 3.1267374200001544e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.4955222439416437e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9527710601687431e+08, - "cpu_time": 3.1256855419999284e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.4985567344868822e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time_median", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9528680667281151e+08, - "cpu_time": 3.1267374200001538e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.4982814368969345e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3690921482242667e+05, - "cpu_time": 2.8403956623203168e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8563899288324048e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPURdHost_fine/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.0110223166967682e-04, - "cpu_time": 9.0872726131718525e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0134584674650584e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_numa": NaN - } - ] -} diff --git a/results/implicit_managed_GPUWrGPU_coarse.json b/results/implicit_managed_GPUWrGPU_coarse.json deleted file mode 100644 index 0997eea..0000000 --- a/results/implicit_managed_GPUWrGPU_coarse.json +++ /dev/null @@ -1,25272 +0,0 @@ -{ - "context": { - "date": "2023-10-09T14:06:38-04:00", - "host_name": "frontier10485", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1795, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [2.13,2.48,2.18], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52603, - "real_time": 1.3321691730141269e+04, - "cpu_time": 2.5173792996597153e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0746845693272656e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52603, - "real_time": 1.3308491395705905e+04, - "cpu_time": 2.5173603862897558e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0777342662006062e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52603, - "real_time": 1.3305051256349116e+04, - "cpu_time": 2.4855893637245015e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0785300417729735e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52603, - "real_time": 1.3319280152750292e+04, - "cpu_time": 2.4969430640837985e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0752412690667963e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52603, - "real_time": 1.3306018095916816e+04, - "cpu_time": 2.5231592627796876e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0783063501596534e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3312106526172682e+04, - "cpu_time": 2.5080862753074918e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0768992993054593e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3308491395705903e+04, - "cpu_time": 2.5173603862897558e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0777342662006062e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7982696295497247e+00, - "cpu_time": 1.6045611351742340e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8021082076279438e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.8580282648863227e-04, - "cpu_time": 6.3975515952995462e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8568969352839370e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52606, - "real_time": 1.3309076785971258e+04, - "cpu_time": 2.5168491236741047e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1551977885009778e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52606, - "real_time": 1.3308726789014810e+04, - "cpu_time": 2.5390058985667045e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1553596597698426e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52606, - "real_time": 1.3309715479913597e+04, - "cpu_time": 2.5118054613542176e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1549024187353861e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52606, - "real_time": 1.3305740521943466e+04, - "cpu_time": 2.5294375698589538e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1567411347680926e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52606, - "real_time": 1.3304073769861208e+04, - "cpu_time": 2.5440273352849497e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1575124594979310e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3307466669340869e+04, - "cpu_time": 2.5282250777477864e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1559426922544467e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3308726789014810e+04, - "cpu_time": 2.5294375698589538e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1553596597698426e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4356148089168075e+00, - "cpu_time": 1.3842179303777775e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1267938054497815e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8302618142401446e-04, - "cpu_time": 5.4750581447870050e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8304163339069745e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52594, - "real_time": 1.3309521309438478e+04, - "cpu_time": 2.5607132847853343e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2309984423242366e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52594, - "real_time": 1.3308149294797822e+04, - "cpu_time": 2.5516492926949821e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2311253531251361e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52594, - "real_time": 1.3309682828410350e+04, - "cpu_time": 2.5361988268623802e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2309835036059108e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52594, - "real_time": 1.3309442631160506e+04, - "cpu_time": 2.5287045366391605e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2310057193260100e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52594, - "real_time": 1.3308101000117293e+04, - "cpu_time": 2.5316552933794679e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2311298208403738e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3308979412784887e+04, - "cpu_time": 2.5417842468722651e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2310485678443334e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3309442631160506e+04, - "cpu_time": 2.5361988268623805e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2310057193260100e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8481231846838695e-01, - "cpu_time": 1.3788573536857695e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2594677490846399e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.8968632689782321e-05, - "cpu_time": 5.4247615838460377e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8969791596415733e-05, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52607, - "real_time": 1.3307911356108500e+04, - "cpu_time": 2.5693408804911847e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4622947300410953e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52607, - "real_time": 1.3308522931192065e+04, - "cpu_time": 2.5425501549223492e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4621815786333036e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52607, - "real_time": 1.3309301742896567e+04, - "cpu_time": 2.5260941604729414e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4620375007643747e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52607, - "real_time": 1.3306622368203045e+04, - "cpu_time": 2.5413126352006402e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4625332479789205e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52607, - "real_time": 1.3302637519350748e+04, - "cpu_time": 2.5451912236014217e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4632709079183631e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3306999183550182e+04, - "cpu_time": 2.5448978109377076e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4624635930672116e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3307911356108500e+04, - "cpu_time": 2.5425501549223492e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4622947300410953e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6278198973652156e+00, - "cpu_time": 1.5568333122228145e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8636678307631164e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9747652052264853e-04, - "cpu_time": 6.1174688646895995e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9751227366188170e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52610, - "real_time": 1.3307320594182254e+04, - "cpu_time": 2.5706459019197824e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.9248080810987062e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52610, - "real_time": 1.3308059659430783e+04, - "cpu_time": 2.5691899695875341e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.9245345810843124e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52610, - "real_time": 1.3308157035057564e+04, - "cpu_time": 2.5752654058163771e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.9244985483233385e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52610, - "real_time": 1.3305496044016423e+04, - "cpu_time": 2.5660560862953844e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.9254834079990578e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52610, - "real_time": 1.3305781384797396e+04, - "cpu_time": 2.5627925622505230e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.9253777816369781e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3306962943496887e+04, - "cpu_time": 2.5687899851739210e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.9249404800284786e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3307320594182253e+04, - "cpu_time": 2.5691899695875341e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.9248080810987062e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2554311629892470e+00, - "cpu_time": 4.7164279859926843e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6464786219243496e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.4343928687557981e-05, - "cpu_time": 1.8360504413416877e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4345883788172832e-05, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52578, - "real_time": 1.3311947021827596e+04, - "cpu_time": 2.5951381186047482e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.8461930313485527e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52578, - "real_time": 1.3314524831299414e+04, - "cpu_time": 2.5585097398151258e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.8442867215118027e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52578, - "real_time": 1.3305106889480152e+04, - "cpu_time": 2.5664589676290532e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.8512549420879669e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52578, - "real_time": 1.3310557357393183e+04, - "cpu_time": 2.5614871999695781e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.8472210051518002e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52578, - "real_time": 1.3313116461628691e+04, - "cpu_time": 2.5978352942295347e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.8453281301773434e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3311050512325808e+04, - "cpu_time": 2.5758858640496084e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.8468567660554943e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3311947021827596e+04, - "cpu_time": 2.5664589676290532e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.8461930313485527e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6301729439563699e+00, - "cpu_time": 1.9043006508324237e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6860297274304316e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7271874151441999e-04, - "cpu_time": 7.3927990265788782e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7278042031542778e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51663, - "real_time": 1.3548690521392420e+04, - "cpu_time": 2.6229305053907057e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9348290492434914e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51663, - "real_time": 1.3546791887800320e+04, - "cpu_time": 2.5933087277161652e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9351002227772911e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51663, - "real_time": 1.3543270549193310e+04, - "cpu_time": 2.5873369684300218e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9356033614466507e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51663, - "real_time": 1.3547460953300699e+04, - "cpu_time": 2.5895856976946769e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9350046544044945e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51663, - "real_time": 1.3546206541319812e+04, - "cpu_time": 2.6152273929117651e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9351838405858181e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3546484090601312e+04, - "cpu_time": 2.6016778584286669e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9351442256915493e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3546791887800320e+04, - "cpu_time": 2.5933087277161649e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9351002227772911e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0199763975585405e+00, - "cpu_time": 1.6257219270663671e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8858602493121526e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4911444062153518e-04, - "cpu_time": 6.2487441394771795e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4912894920175019e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51504, - "real_time": 1.3593763372226567e+04, - "cpu_time": 2.6504293375271878e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8568274703911156e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51504, - "real_time": 1.3579308840087402e+04, - "cpu_time": 2.6215984428393898e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8609328808565887e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51504, - "real_time": 1.3595804397551365e+04, - "cpu_time": 2.6488858632339226e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8562484768788338e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51504, - "real_time": 1.3597649976324947e+04, - "cpu_time": 2.6563408667287928e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8557250768540520e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51504, - "real_time": 1.3594679940940838e+04, - "cpu_time": 2.6465099370922773e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8565674387161484e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3592241305426223e+04, - "cpu_time": 2.6447528894843144e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8572602687393486e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3594679940940836e+04, - "cpu_time": 2.6488858632339223e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8565674387161484e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3732902535716587e+00, - "cpu_time": 1.3442473421335441e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0937970578533154e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.4246316614671442e-04, - "cpu_time": 5.0826954286668788e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4281975080142097e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51212, - "real_time": 1.3667810402811938e+04, - "cpu_time": 2.6652741330157038e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.6718652739305771e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51212, - "real_time": 1.3668213767530448e+04, - "cpu_time": 2.6565489611809800e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.6716388683570847e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51212, - "real_time": 1.3663752130771876e+04, - "cpu_time": 2.6526471041943212e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.6741438952081253e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51212, - "real_time": 1.3664480283503784e+04, - "cpu_time": 2.6506134694993412e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.6737349554807129e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51212, - "real_time": 1.3656064060919427e+04, - "cpu_time": 2.6585112102632309e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.6784642728850983e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3664064129107495e+04, - "cpu_time": 2.6567189756307151e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.6739694531723190e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3664480283503788e+04, - "cpu_time": 2.6565489611809800e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.6737349554807129e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8868620854826990e+00, - "cpu_time": 5.7072118824448715e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7453606050971154e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.5764338042534470e-04, - "cpu_time": 2.1482181347727818e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5774974370822118e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 50522, - "real_time": 1.3855203618468355e+04, - "cpu_time": 2.6975141839198604e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.5136204835016583e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 50522, - "real_time": 1.3818814505079421e+04, - "cpu_time": 2.6939186433632920e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.5176063035140561e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 50522, - "real_time": 1.3856704448562061e+04, - "cpu_time": 2.7069265250781878e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.5134565421272485e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 50522, - "real_time": 1.3850417474158041e+04, - "cpu_time": 2.6912957701595296e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.5141435295454764e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 50522, - "real_time": 1.3874888584744656e+04, - "cpu_time": 2.6956484422627691e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.5114730379210425e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3851205726202510e+04, - "cpu_time": 2.6970607129567285e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.5140599793218964e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3855203618468357e+04, - "cpu_time": 2.6956484422627691e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.5136204835016583e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0352576163340597e+01, - "cpu_time": 5.9716321057006837e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2267102838379097e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4693721662684832e-03, - "cpu_time": 2.2141259471886768e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4706882912493260e-03, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 42864, - "real_time": 1.6350391099072593e+04, - "cpu_time": 2.9800858785927474e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5652621852194742e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 42864, - "real_time": 1.6342253332231800e+04, - "cpu_time": 2.9808526222471228e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5665395797821722e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 42864, - "real_time": 1.6350432004097553e+04, - "cpu_time": 2.9601094438223219e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5652557675227618e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 42864, - "real_time": 1.6353474322628037e+04, - "cpu_time": 2.9679539986935441e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5647785401762671e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 42864, - "real_time": 1.6343344160198094e+04, - "cpu_time": 2.9692331117021298e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5663682774389801e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6347978983645615e+04, - "cpu_time": 2.9716470110115730e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5656408700279312e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6350391099072591e+04, - "cpu_time": 2.9692331117021298e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.5652621852194742e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9066035414390807e+00, - "cpu_time": 8.7826315928247396e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7008435522691146e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0013517550686884e-04, - "cpu_time": 2.9554760576475931e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0015282505946664e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 39453, - "real_time": 1.7726687496227842e+04, - "cpu_time": 3.1370318252097462e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7321915060470593e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 39453, - "real_time": 1.7734652237165436e+04, - "cpu_time": 3.1123630927939623e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7300662498588513e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 39453, - "real_time": 1.7726886168571433e+04, - "cpu_time": 3.1187868805920745e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7321384704734180e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 39453, - "real_time": 1.7739855122022247e+04, - "cpu_time": 3.1067833903632196e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7286789786610980e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 39453, - "real_time": 1.7745483643806441e+04, - "cpu_time": 3.1415502015055867e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7271791337892371e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7734712933558680e+04, - "cpu_time": 3.1233030780929177e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7300508677659326e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7734652237165436e+04, - "cpu_time": 3.1187868805920745e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7300662498588513e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.1871832747612334e+00, - "cpu_time": 1.5284104579061346e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1834370658359209e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6164735259226878e-04, - "cpu_time": 4.8935707476694167e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6160963737525043e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 29361, - "real_time": 2.3844876431288703e+04, - "cpu_time": 3.7710210789822981e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.0359836203576721e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 29361, - "real_time": 2.3820686605135255e+04, - "cpu_time": 3.7550972582677467e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.0431286377711597e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 29361, - "real_time": 2.3855442887392739e+04, - "cpu_time": 3.7318243281904215e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.0328671235303369e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 29361, - "real_time": 2.3867049604957083e+04, - "cpu_time": 3.7528120806512168e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.0294469897592383e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 29361, - "real_time": 2.3837682976407417e+04, - "cpu_time": 3.7400402540785341e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.0381068565282593e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3845147701036240e+04, - "cpu_time": 3.7501590000340439e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.0359066455893347e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time_median", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3844876431288703e+04, - "cpu_time": 3.7528120806512175e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.0359836203576721e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7605575617003790e+01, - "cpu_time": 1.5043277406514250e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1954276071323609e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.3832948479655265e-04, - "cpu_time": 4.0113705595889891e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3841622250478097e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19194, - "real_time": 3.6425490241659914e+04, - "cpu_time": 5.0561420079191412e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 9.2117996977906750e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19194, - "real_time": 3.6427274712152532e+04, - "cpu_time": 5.0261795144315554e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 9.2113484374404431e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19194, - "real_time": 3.6435334708596849e+04, - "cpu_time": 5.0248884078357733e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 9.2093107606564392e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19194, - "real_time": 3.6433250847838834e+04, - "cpu_time": 5.0323102740439244e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 9.2098375025983716e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19194, - "real_time": 3.6439844979536254e+04, - "cpu_time": 5.0448311607793876e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 9.2081708961285010e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6432239097956881e+04, - "cpu_time": 5.0368702730019570e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 9.2100934589228870e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time_median", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6433250847838834e+04, - "cpu_time": 5.0323102740439252e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 9.2098375025983716e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.8874456716194006e+00, - "cpu_time": 1.3355022492415634e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4883379999551392e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6159988563397326e-04, - "cpu_time": 2.6514525426631821e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6159857732097314e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 11326, - "real_time": 6.1803466774049906e+04, - "cpu_time": 7.6959267437753297e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.0858430360443425e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 11326, - "real_time": 6.1839052262158199e+04, - "cpu_time": 7.6608877450115120e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.0852181840611198e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 11326, - "real_time": 6.1824006624125432e+04, - "cpu_time": 7.6637296485961298e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.0854822853524390e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 11326, - "real_time": 6.1850651000712031e+04, - "cpu_time": 7.6566658926363452e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.0850146750957794e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 11326, - "real_time": 6.1822213159354229e+04, - "cpu_time": 7.6663222850079488e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.0855137752351050e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.1827877964079962e+04, - "cpu_time": 7.6687064630054534e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.0854143911577571e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time_median", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.1824006624125432e+04, - "cpu_time": 7.6637296485961298e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.0854822853524390e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7933624963990024e+01, - "cpu_time": 1.5632533043450354e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1483861356062967e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9005726145750775e-04, - "cpu_time": 2.0384836893761857e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9006305437392178e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6243, - "real_time": 1.1203101041936215e+05, - "cpu_time": 1.2968518500720811e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.1980408593798003e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6243, - "real_time": 1.1196514529381139e+05, - "cpu_time": 1.2970966282236220e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.1987456243440303e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6243, - "real_time": 1.1196852835303928e+05, - "cpu_time": 1.2983866554541224e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.1987094049928789e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6243, - "real_time": 1.1203157595811471e+05, - "cpu_time": 1.2946309594746078e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.1980348116336418e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6243, - "real_time": 1.1201514631204188e+05, - "cpu_time": 1.2964515329168760e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.1982105315124807e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1200228126727389e+05, - "cpu_time": 1.2966835252282617e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.1983482463725664e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time_median", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1201514631204188e+05, - "cpu_time": 1.2968518500720810e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.1982105315124807e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3043124152135043e+01, - "cpu_time": 1.3570636048786619e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5356692546425909e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9502188507467449e-04, - "cpu_time": 1.0465650087131098e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9504522290120256e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3255, - "real_time": 2.1511319738697581e+05, - "cpu_time": 2.4584597480798801e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2478799964890142e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3255, - "real_time": 2.1528204244571508e+05, - "cpu_time": 2.4621775422426782e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2469012879589709e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3255, - "real_time": 2.1505828838371250e+05, - "cpu_time": 2.4573058801843008e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2481986070727515e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3255, - "real_time": 2.1493896566969436e+05, - "cpu_time": 2.4549455944700417e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2488915407386667e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3255, - "real_time": 2.1500800645136961e+05, - "cpu_time": 2.4560504700460861e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2484905117275925e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1508010006749351e+05, - "cpu_time": 2.4577878470045974e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2480723887973992e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time_median", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1505828838371247e+05, - "cpu_time": 2.4573058801843008e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2481986070727515e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2987331707942468e+02, - "cpu_time": 2.7861283852200074e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5336905232412601e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.0383697533462931e-04, - "cpu_time": 1.1335918959057313e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0362608698526470e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1574, - "real_time": 4.5693562562953745e+05, - "cpu_time": 5.2882824142312328e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.1749377415261345e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1574, - "real_time": 4.4407198281622614e+05, - "cpu_time": 5.1513982274460356e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.2089727178806899e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1574, - "real_time": 4.5712358042245125e+05, - "cpu_time": 5.2877162388818164e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.1744546441989500e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1574, - "real_time": 4.4352997580245545e+05, - "cpu_time": 5.1447880559084564e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.2104501190222100e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1574, - "real_time": 4.5738950792730827e+05, - "cpu_time": 5.2865456162643898e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.1737718130721169e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5181013451959565e+05, - "cpu_time": 5.2317461105463858e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.1885174071400203e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time_median", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5693562562953739e+05, - "cpu_time": 5.2865456162643910e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.1749377415261345e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3156133418275513e+03, - "cpu_time": 7.6402683709884823e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9358878790762802e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6191786732730456e-02, - "cpu_time": 1.4603668086237764e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6288258526517413e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 713, - "real_time": 9.8514944345325872e+05, - "cpu_time": 1.2362175610098341e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.0899278593064998e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 713, - "real_time": 9.8846185179152968e+05, - "cpu_time": 1.2388727671809245e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.0862754309171420e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 713, - "real_time": 9.8053502811374969e+05, - "cpu_time": 1.2307994544179323e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.0950570792616676e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 713, - "real_time": 9.8390446550984774e+05, - "cpu_time": 1.2345148120617340e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.0913069933508226e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 713, - "real_time": 9.8385197273096361e+05, - "cpu_time": 1.2346355582047568e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.0913652193220911e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8438055231986998e+05, - "cpu_time": 1.2350080305750365e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.0907865164316445e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time_median", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8390446550984774e+05, - "cpu_time": 1.2346355582047568e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.0913069933508226e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8522933932074789e+03, - "cpu_time": 2.9365484136840705e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1595365452517433e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8975515480121343e-03, - "cpu_time": 2.3777565335480243e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8965672912677040e-03, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2670796795063997e+06, - "cpu_time": 2.5666702977347067e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8067296165310794e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2674140695205205e+06, - "cpu_time": 2.5762048252427438e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8064631665914299e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2672841455003782e+06, - "cpu_time": 2.5668267443365087e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8065666838137014e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2743660911411336e+06, - "cpu_time": 2.5793663527508304e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8009413770079932e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2684072813435085e+06, - "cpu_time": 2.5669491100322967e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8056722149005199e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2689102534023882e+06, - "cpu_time": 2.5712034660194172e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8052746117689447e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time_median", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2674140695205205e+06, - "cpu_time": 2.5669491100322967e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8064631665914299e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0924480683726006e+03, - "cpu_time": 6.1125110656488851e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4563266954867663e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3629662362075630e-03, - "cpu_time": 2.3772957474703107e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3606388077877368e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2667756810494997e+06, - "cpu_time": 2.5792763203883255e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6139438359454991e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2674089419718795e+06, - "cpu_time": 2.5682626148866829e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6129345035023671e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2741242946339562e+06, - "cpu_time": 2.5800385631067539e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6022657245823881e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2671702800131734e+06, - "cpu_time": 2.5682880258900444e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6133148322464782e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2791438799315286e+06, - "cpu_time": 2.5804691391585637e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.5943320964212706e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2709246155200074e+06, - "cpu_time": 2.5752669326860742e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6073581985396007e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time_median", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2674089419718790e+06, - "cpu_time": 2.5792763203883255e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6129345035023671e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5105105646502716e+03, - "cpu_time": 6.3967219477509625e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7401360059408544e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4265493125532251e-03, - "cpu_time": 2.4839063735730906e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4228633600841751e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 308, - "real_time": 2.2754470671091666e+06, - "cpu_time": 2.5778960616883063e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2003432805910064e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 308, - "real_time": 2.2821940970002348e+06, - "cpu_time": 2.5908090194804813e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1790563394829053e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 308, - "real_time": 2.2759208343802141e+06, - "cpu_time": 2.5791892597402688e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1988444204658559e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 308, - "real_time": 2.2755249822209892e+06, - "cpu_time": 2.5899425616883636e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2000967372411191e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 308, - "real_time": 2.2746938161322144e+06, - "cpu_time": 2.5769317792207748e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2027276303316308e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2767561593685639e+06, - "cpu_time": 2.5829537363636391e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1962136816225043e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time_median", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2755249822209887e+06, - "cpu_time": 2.5791892597402688e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2000967372411191e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0721211261222816e+03, - "cpu_time": 6.8294303837106345e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6935340885045644e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3493413045050483e-03, - "cpu_time": 2.6440389882187031e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3470325531410566e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 306, - "real_time": 2.3035851689177305e+06, - "cpu_time": 2.6105558627450382e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4224783369045153e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 306, - "real_time": 2.2895239777497803e+06, - "cpu_time": 2.5957540032679718e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4312145371024013e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 306, - "real_time": 2.2892139500518348e+06, - "cpu_time": 2.6066535130718676e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4314083661449833e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 306, - "real_time": 2.2894649315941958e+06, - "cpu_time": 2.5955676470587626e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4312514486597989e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 306, - "real_time": 2.2897624488299093e+06, - "cpu_time": 2.5968571862745527e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4310654809080638e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2923100954286903e+06, - "cpu_time": 2.6010776424836391e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4294836339439524e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time_median", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2895239777497803e+06, - "cpu_time": 2.5968571862745532e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4312145371024013e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3059755498065861e+03, - "cpu_time": 7.0256748221957478e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9179782761349794e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7509260472140841e-03, - "cpu_time": 2.7010630930214300e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7408346504291608e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 302, - "real_time": 2.3203473746320172e+06, - "cpu_time": 2.6366761655629189e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8244046868367426e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 302, - "real_time": 2.3270356299244608e+06, - "cpu_time": 2.6436129271523566e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8162869170218680e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 302, - "real_time": 2.3266324790391997e+06, - "cpu_time": 2.6432051854304341e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8167749135464482e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 302, - "real_time": 2.3210685228349161e+06, - "cpu_time": 2.6382064470198727e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8235271537763726e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 302, - "real_time": 2.3206134060003012e+06, - "cpu_time": 2.6500457649005787e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8240809016506862e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3231394824861791e+06, - "cpu_time": 2.6423492980132326e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8210149145664241e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time_median", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3210685228349161e+06, - "cpu_time": 2.6432051854304341e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8235271537763726e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3855129719143033e+03, - "cpu_time": 5.2657513843494680e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1089459751331000e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4573007765729124e-03, - "cpu_time": 1.9928294068875590e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4565488306766449e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 294, - "real_time": 2.3970377115139952e+06, - "cpu_time": 2.7338352006802983e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4680825157820940e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 294, - "real_time": 2.3829517418797426e+06, - "cpu_time": 2.7195769251700412e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5004051360522538e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 294, - "real_time": 2.3934828904679134e+06, - "cpu_time": 2.7312682857142533e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4762037582134590e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 294, - "real_time": 2.3826447641793764e+06, - "cpu_time": 2.7189858401360498e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5011138030533656e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 294, - "real_time": 2.3949033625069121e+06, - "cpu_time": 2.7319517755101947e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4729556963333093e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3902040941095883e+06, - "cpu_time": 2.7271236054421673e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4837521818868965e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time_median", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3934828904679134e+06, - "cpu_time": 2.7312682857142533e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4762037582134590e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8788087216619097e+03, - "cpu_time": 7.2234119140095881e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5794207862773619e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8779168852626539e-03, - "cpu_time": 2.6487291956971658e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8801826448216724e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 281, - "real_time": 2.5006308439071705e+06, - "cpu_time": 2.8724424128114278e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0483114716381201e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 281, - "real_time": 2.4999173762429226e+06, - "cpu_time": 2.8660583416369581e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0486106560608460e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 281, - "real_time": 2.4999048456456843e+06, - "cpu_time": 2.8674104021352460e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0486159121480182e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 281, - "real_time": 2.5009178080897634e+06, - "cpu_time": 2.8728240604982683e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0481911846604401e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 281, - "real_time": 2.5079441513680583e+06, - "cpu_time": 2.8760263594305874e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0452545358994660e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5018630050507202e+06, - "cpu_time": 2.8709523153024977e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0477967520813781e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time_median", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5006308439071709e+06, - "cpu_time": 2.8724424128114283e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0483114716381201e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4282582538100878e+03, - "cpu_time": 4.1220708268699800e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4332514869170729e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3702821644866947e-03, - "cpu_time": 1.4357851939577262e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3678716641085352e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 271, - "real_time": 2.5869171123099392e+06, - "cpu_time": 3.0228486715866379e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0266903701906660e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 271, - "real_time": 2.5915399991058335e+06, - "cpu_time": 3.0242269815498041e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0230750834673461e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 271, - "real_time": 2.5880837630879176e+06, - "cpu_time": 3.0244113763837893e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0257767831071156e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 271, - "real_time": 2.5918635495034531e+06, - "cpu_time": 3.0252947970479256e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0228225367050770e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 271, - "real_time": 2.5862269326907024e+06, - "cpu_time": 3.0235690405904138e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0272312277505070e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5889262713395692e+06, - "cpu_time": 3.0240701734317141e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0251192002441421e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time_median", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5880837630879176e+06, - "cpu_time": 3.0242269815498041e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0257767831071156e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6216476282217868e+03, - "cpu_time": 9.1977064119422482e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0502882251039729e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0126389682257296e-03, - "cpu_time": 3.0414990011639492e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0124284164886672e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 254, - "real_time": 2.7583688690041113e+06, - "cpu_time": 3.3293830944882119e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8014350139420646e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 254, - "real_time": 2.7589911803984502e+06, - "cpu_time": 3.3255089409448416e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8005775714316201e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 254, - "real_time": 2.7533092968693869e+06, - "cpu_time": 3.3203689803149845e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8084206565251100e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 254, - "real_time": 2.7606869978082227e+06, - "cpu_time": 3.3275563661417696e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7982429765941966e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 254, - "real_time": 2.7528507314167740e+06, - "cpu_time": 3.3217880275590844e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8090550571201622e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7568414150993889e+06, - "cpu_time": 3.3249210818897784e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8035462551226306e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time_median", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7583688690041108e+06, - "cpu_time": 3.3255089409448416e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8014350139420646e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5406400581398325e+03, - "cpu_time": 3.7992603220103797e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8862530073666875e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2843103846117265e-03, - "cpu_time": 1.1426618041264914e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2846571803316086e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 226, - "real_time": 3.0865244890884622e+06, - "cpu_time": 3.9808283185839904e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7945419108576334e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 226, - "real_time": 3.0896601120867166e+06, - "cpu_time": 3.9853933141593430e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7876462909171283e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 226, - "real_time": 3.0853280733726854e+06, - "cpu_time": 3.9747017566371276e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7971766701215863e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 226, - "real_time": 3.0840615179406200e+06, - "cpu_time": 3.9767947522124313e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7999681193142080e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 226, - "real_time": 3.0845981369421412e+06, - "cpu_time": 3.9814460132743530e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7987851476788235e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0860344658861253e+06, - "cpu_time": 3.9798328309734492e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7956236277778769e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time_median", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0853280733726854e+06, - "cpu_time": 3.9808283185839904e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7971766701215863e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2271050675102497e+03, - "cpu_time": 4.1853964084884601e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9012694820831879e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.2167213040854944e-04, - "cpu_time": 1.0516513095512937e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2123910189032499e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 193, - "real_time": 3.6207069847925804e+06, - "cpu_time": 5.0414142020723978e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1584212745236216e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 193, - "real_time": 3.6230978768299590e+06, - "cpu_time": 5.0441273160622930e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1576568292076669e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 193, - "real_time": 3.6155173996550278e+06, - "cpu_time": 5.0320746839378541e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1600840312371881e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 193, - "real_time": 3.6199467794709099e+06, - "cpu_time": 5.0399806113989186e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1586645482708001e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 193, - "real_time": 3.6216372180093136e+06, - "cpu_time": 5.0400590673574433e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1581237289983068e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6201812517515579e+06, - "cpu_time": 5.0395311761657810e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1585900824475167e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time_median", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6207069847925799e+06, - "cpu_time": 5.0400590673574423e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1584212745236216e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8596078598272461e+03, - "cpu_time": 4.4930564766321795e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1574715532181703e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.8990737230178116e-04, - "cpu_time": 8.9156239331981382e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.9039788894731862e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 142, - "real_time": 4.9269542452210272e+06, - "cpu_time": 7.6438902323944131e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7025950683704147e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 142, - "real_time": 5.0513068194383048e+06, - "cpu_time": 7.8420754366197316e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6606807505177040e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 142, - "real_time": 5.0416116169850593e+06, - "cpu_time": 7.8366178873238433e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6638742999835601e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 142, - "real_time": 5.0804420295630544e+06, - "cpu_time": 7.8861314366195574e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6511571141225021e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 142, - "real_time": 5.0537107630409822e+06, - "cpu_time": 7.8547196056338008e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6598907997165041e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0308050948496852e+06, - "cpu_time": 7.8126869197182683e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6676396065421371e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time_median", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0513068194383057e+06, - "cpu_time": 7.8420754366197316e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6606807505177040e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9813450668306803e+04, - "cpu_time": 9.6293226054520259e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0101020408550408e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1889439073984629e-02, - "cpu_time": 1.2325238044735658e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2053575802406144e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 88, - "real_time": 7.9947488636455750e+06, - "cpu_time": 1.3785636227272781e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0985294580409937e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 88, - "real_time": 7.9880071518180724e+06, - "cpu_time": 1.3770164488636347e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1003005732389088e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 88, - "real_time": 8.0053869910030207e+06, - "cpu_time": 1.3793057227272825e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0957407829072270e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 88, - "real_time": 7.9934634850360453e+06, - "cpu_time": 1.3778409954545431e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0988669093700559e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 88, - "real_time": 7.9996634740382433e+06, - "cpu_time": 1.3789873750000160e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0972402219728417e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9962539931081925e+06, - "cpu_time": 1.3783428329545507e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0981355891060057e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time_median", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9947488636455741e+06, - "cpu_time": 1.3785636227272782e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0985294580409937e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.5783537452286928e+03, - "cpu_time": 9.2228993833490913e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7258257005850852e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.2267943850938732e-04, - "cpu_time": 6.6912956362092573e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2255203598183193e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.3587726736623866e+07, - "cpu_time": 2.4966120921568383e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4694662065552583e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.3593809770456716e+07, - "cpu_time": 2.4989778803921591e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4683611560405602e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3599309321565956e+07, - "cpu_time": 2.4964482882352866e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4673629525279613e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.3545812965900291e+07, - "cpu_time": 2.4950941823529512e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4771072865444574e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.3614079586285003e+07, - "cpu_time": 2.4946698352940913e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4646860470687394e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3588147676166365e+07, - "cpu_time": 2.4963604556862652e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4693967297473950e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time_median", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3593809770456716e+07, - "cpu_time": 2.4964482882352866e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4683611560405602e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5600344165761271e+04, - "cpu_time": 1.6869790322950699e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6598472918498088e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8840201605009280e-03, - "cpu_time": 6.7577541875109878e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8870387393468704e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 28, - "real_time": 2.4680016163204398e+07, - "cpu_time": 4.7669534357142746e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7191580247039328e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 28, - "real_time": 2.4752084831041951e+07, - "cpu_time": 4.7713217035713740e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7112408695302224e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 28, - "real_time": 2.4812113826296158e+07, - "cpu_time": 4.7765899785714187e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7046814499487453e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 28, - "real_time": 2.4774759475673947e+07, - "cpu_time": 4.7756220250000015e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7087594560057554e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 28, - "real_time": 2.4701176344283991e+07, - "cpu_time": 4.7670755535714343e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7168286669687057e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4744030128100090e+07, - "cpu_time": 4.7715125392857008e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7121336934314728e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time_median", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4752084831041947e+07, - "cpu_time": 4.7713217035713740e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7112408695302224e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3802405826294307e+04, - "cpu_time": 4.5600698575039205e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8970872465107720e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1743590493447798e-03, - "cpu_time": 9.5568644532715956e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1743350118738434e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 16, - "real_time": 4.4985790038481355e+07, - "cpu_time": 8.7245433562500805e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9835583166415133e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 16, - "real_time": 4.4974370393902063e+07, - "cpu_time": 8.7138127750000298e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9843158853469615e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 16, - "real_time": 4.4997719582170248e+07, - "cpu_time": 8.6632033062500119e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9827673323512597e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 16, - "real_time": 4.5002229977399111e+07, - "cpu_time": 8.7162758999998152e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9824683813981314e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 16, - "real_time": 4.4901730027049780e+07, - "cpu_time": 8.6987477562498584e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9891438017899160e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4972368003800511e+07, - "cpu_time": 8.7033166187499598e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9844507435055566e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time_median", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4985790038481355e+07, - "cpu_time": 8.7138127750000298e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9835583166415133e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0952180436629285e+04, - "cpu_time": 2.4282910635153399e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7204338406952666e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.1060760761293481e-04, - "cpu_time": 2.7900755193531164e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1153584846899709e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.5514955222606659e+07, - "cpu_time": 1.6462495875000373e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1390469105810471e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.4206132218241692e+07, - "cpu_time": 1.6127975512499404e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1878373810624738e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.5413591004908085e+07, - "cpu_time": 1.6443795149999830e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1427721612193427e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.5475795902311802e+07, - "cpu_time": 1.6440126887500384e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1404850129361572e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.5597071796655655e+07, - "cpu_time": 1.6462222850000075e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1360355017481799e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5241509228944793e+07, - "cpu_time": 1.6387323255000013e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1492353935094404e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time_median", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5475795902311802e+07, - "cpu_time": 1.6443795149999827e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1404850129361572e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.8260307848157547e+05, - "cpu_time": 1.4534392161275942e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1716919105486397e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.8347344357406739e-03, - "cpu_time": 8.8692899597506182e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8959338988266380e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.6659506782889366e+08, - "cpu_time": 3.1118044749999285e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2226098827331972e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6362842544913292e+08, - "cpu_time": 3.0698701099998969e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2810369624127245e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.6655986011028290e+08, - "cpu_time": 3.1119765725000548e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2232910837252512e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.6415042430162430e+08, - "cpu_time": 3.0760170949999124e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2706032548140516e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.6660086438059807e+08, - "cpu_time": 3.1109224450000286e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2224977583160887e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6550692841410640e+08, - "cpu_time": 3.0961181394999641e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2440077884002633e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time_median", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6655986011028290e+08, - "cpu_time": 3.1109224450000280e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2232910837252512e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4881435782711054e+06, - "cpu_time": 2.1270457932349737e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9275468294862852e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.9914276854180866e-03, - "cpu_time": 6.8700407975339746e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0244753417499154e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.1615597009658813e+08, - "cpu_time": 5.5545824199998605e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3962408607117667e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.1564435362815857e+08, - "cpu_time": 5.5323487500001538e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.4017457041696682e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.1797873973846436e+08, - "cpu_time": 5.5704255500000954e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3767723744145484e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.1614874303340912e+08, - "cpu_time": 5.5434776350000453e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3963184977348843e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.1524586677551270e+08, - "cpu_time": 5.5430723699998903e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.4060456842234001e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1623473465442657e+08, - "cpu_time": 5.5487813450000083e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3954246242508540e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time_median", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1614874303340912e+08, - "cpu_time": 5.5434776350000453e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3963184977348843e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0466089988274320e+06, - "cpu_time": 1.4429795520076875e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1204180492027072e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.3095953231422862e-03, - "cpu_time": 2.6005341755049550e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2997877237516634e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2671459435596820e+06, - "cpu_time": 2.5768962524271961e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8066768095082599e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2662962269954216e+06, - "cpu_time": 2.5772360582523164e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8073541981007212e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2711133490946493e+06, - "cpu_time": 2.5761892297734967e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8035207276787038e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2666245249844487e+06, - "cpu_time": 2.5796639061488574e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8070924208446492e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2672645116230911e+06, - "cpu_time": 2.5805142750809379e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8065823281765003e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2676889112514583e+06, - "cpu_time": 2.5780999443365606e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8062452968617671e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time_median", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2671459435596820e+06, - "cpu_time": 2.5772360582523164e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8066768095082599e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9541104790882480e+03, - "cpu_time": 1.8788941575709184e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5548594391025226e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.6171893745771457e-04, - "cpu_time": 7.2879027118338770e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6082407622264207e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2770649275793708e+06, - "cpu_time": 2.5859992556632683e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.5976137091130242e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2754224641158166e+06, - "cpu_time": 2.5836218543688417e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6002105671323091e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2678403138608029e+06, - "cpu_time": 2.5827201294497689e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6122472776991185e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2673561436675708e+06, - "cpu_time": 2.5750315922330343e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6130186353296041e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2742185820026691e+06, - "cpu_time": 2.5889745533978785e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6021163773915493e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2723804862452457e+06, - "cpu_time": 2.5832694770225585e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6050413133331211e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time_median", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2742185820026691e+06, - "cpu_time": 2.5836218543688417e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6021163773915493e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4842334796919295e+03, - "cpu_time": 5.2030828897694555e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1173072900868510e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9733638388619618e-03, - "cpu_time": 2.0141463893137697e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9742651114048916e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 308, - "real_time": 2.2758668161589992e+06, - "cpu_time": 2.5938402272727261e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1990152866903804e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 308, - "real_time": 2.2799468337703352e+06, - "cpu_time": 2.5915577954543927e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1861324822675241e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 308, - "real_time": 2.2730460456971610e+06, - "cpu_time": 2.5835216753247413e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2079490123020792e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 308, - "real_time": 2.2811463008961314e+06, - "cpu_time": 2.5989386948052384e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1823538865366364e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 308, - "real_time": 2.2748782255614251e+06, - "cpu_time": 2.5866417824675278e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2021437525327485e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2769768444168102e+06, - "cpu_time": 2.5909000350649254e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1955188840658739e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time_median", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2758668161589988e+06, - "cpu_time": 2.5915577954543922e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1990152866903804e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4384860948487244e+03, - "cpu_time": 6.0471137123654462e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0863281043914058e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5101102601372323e-03, - "cpu_time": 2.3339818713669176e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5097286545894923e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 306, - "real_time": 2.2895203072431623e+06, - "cpu_time": 2.6112562679740228e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4312168315928293e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 306, - "real_time": 2.2909995001052916e+06, - "cpu_time": 2.6079740588236633e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4302927608013021e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 306, - "real_time": 2.2962371776111764e+06, - "cpu_time": 2.6185580751633979e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4270302876155518e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 306, - "real_time": 2.2903459201402524e+06, - "cpu_time": 2.6070617843137509e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4307009134233054e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 306, - "real_time": 2.2898732412156034e+06, - "cpu_time": 2.6127115718954317e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4309962407615524e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2913952292630975e+06, - "cpu_time": 2.6115123516340535e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4300474068389082e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time_median", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2903459201402524e+06, - "cpu_time": 2.6112562679740223e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4307009134233054e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7628741921298292e+03, - "cpu_time": 4.5681777991406507e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7217809020341047e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2057606461100810e-03, - "cpu_time": 1.7492461011269157e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2040026741771224e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 301, - "real_time": 2.3292334915828765e+06, - "cpu_time": 2.6565222691029189e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8136294723919552e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 301, - "real_time": 2.3254577915162542e+06, - "cpu_time": 2.6638578372093849e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8181977862203624e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 301, - "real_time": 2.3252499781771754e+06, - "cpu_time": 2.6510347906976654e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8184496555237215e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 301, - "real_time": 2.3359445223826109e+06, - "cpu_time": 2.6628161727574728e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8055460809126899e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 301, - "real_time": 2.3320678217751146e+06, - "cpu_time": 2.6580954850497437e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8102098655996874e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3295907210868066e+06, - "cpu_time": 2.6584653109634374e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8132065721296836e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time_median", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3292334915828765e+06, - "cpu_time": 2.6580954850497437e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8136294723919552e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5430602981990578e+03, - "cpu_time": 5.1752814407124943e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4827995111701377e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9501538433667946e-03, - "cpu_time": 1.9467176868435245e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9489501999206159e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 294, - "real_time": 2.3935252181286006e+06, - "cpu_time": 2.7479169965987983e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4761069157432914e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 294, - "real_time": 2.3838990988830724e+06, - "cpu_time": 2.7314100782312341e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4982192854307935e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 294, - "real_time": 2.3909151699824804e+06, - "cpu_time": 2.7431363401359902e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4820849206858493e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 294, - "real_time": 2.3823758368665464e+06, - "cpu_time": 2.7264440918366471e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5017347796976604e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 294, - "real_time": 2.3810751340193609e+06, - "cpu_time": 2.7254135170067945e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5047401960283637e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3863580915760128e+06, - "cpu_time": 2.7348642047618935e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4925772195171922e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time_median", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3838990988830728e+06, - "cpu_time": 2.7314100782312346e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4982192854307935e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5215329574489970e+03, - "cpu_time": 1.0135931002966701e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2698337046637248e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3137906154739891e-03, - "cpu_time": 3.7061916951189795e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3119086977084783e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 280, - "real_time": 2.4894991174473292e+06, - "cpu_time": 2.8713887714285338e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0529989673938745e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 280, - "real_time": 2.4954671514154011e+06, - "cpu_time": 2.8715705928569995e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0504806679234982e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 280, - "real_time": 2.4966214334459179e+06, - "cpu_time": 2.8695300000001513e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0499949911836669e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 280, - "real_time": 2.4911653874109364e+06, - "cpu_time": 2.8676252321428056e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0522946462115298e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 280, - "real_time": 2.4933665641583502e+06, - "cpu_time": 2.8696118892857009e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0513656666784099e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4932239307755874e+06, - "cpu_time": 2.8699452971428381e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0514269878781958e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time_median", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4933665641583502e+06, - "cpu_time": 2.8696118892857013e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0513656666784099e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9456426560410355e+03, - "cpu_time": 1.6117954498687179e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2423613465896306e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1814593224783907e-03, - "cpu_time": 5.6161190649638300e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1815954516221281e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 270, - "real_time": 2.5942266806615172e+06, - "cpu_time": 3.0379723814814109e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0209799086111808e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 270, - "real_time": 2.5968951759514986e+06, - "cpu_time": 3.0371023407408553e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0189032073961231e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 270, - "real_time": 2.5938130803061305e+06, - "cpu_time": 3.0386170444444362e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0213021669939369e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 270, - "real_time": 2.5963363444639575e+06, - "cpu_time": 3.0369559222221039e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0193377530531201e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 270, - "real_time": 2.5933621054584230e+06, - "cpu_time": 3.0378517222223529e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0216536630056247e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5949266773683052e+06, - "cpu_time": 3.0376998822222319e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0204353398119974e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time_median", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5942266806615172e+06, - "cpu_time": 3.0378517222223524e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0209799086111808e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5843079769311919e+03, - "cpu_time": 6.7989522471946566e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2333270417857544e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.1054055621253558e-04, - "cpu_time": 2.2381909045672007e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1042638558307747e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 255, - "real_time": 2.7524577627214147e+06, - "cpu_time": 3.3322805372550008e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8095988763266259e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 255, - "real_time": 2.7576373707430037e+06, - "cpu_time": 3.3368383568628421e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8024433927564490e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 255, - "real_time": 2.7482054954139041e+06, - "cpu_time": 3.3290799529410442e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8154934256183600e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 255, - "real_time": 2.7579529667455778e+06, - "cpu_time": 3.3358097568628751e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8020082744098938e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 255, - "real_time": 2.7508483341365471e+06, - "cpu_time": 3.3296997372549055e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8118277441461837e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7534203859520894e+06, - "cpu_time": 3.3327416682353341e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8082743426515031e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time_median", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7524577627214147e+06, - "cpu_time": 3.3322805372550003e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8095988763266259e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2738866013456736e+03, - "cpu_time": 3.5025051853838022e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9110024192179111e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5522099796859863e-03, - "cpu_time": 1.0509380966327213e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5521472161331706e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 226, - "real_time": 3.1003558295325632e+06, - "cpu_time": 4.0072112566372100e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7642300281261098e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 226, - "real_time": 3.0970439382837014e+06, - "cpu_time": 4.0073835796461850e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7714635045254970e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 226, - "real_time": 3.0934835652268566e+06, - "cpu_time": 4.0089389292036351e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7792569631647873e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 226, - "real_time": 3.0962297830944965e+06, - "cpu_time": 4.0121270752211055e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7732440642826653e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 226, - "real_time": 3.0973179140169406e+06, - "cpu_time": 4.0086557477876195e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7708645293055630e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0968862060309118e+06, - "cpu_time": 4.0088633176991506e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7718118178809249e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time_median", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0970439382837014e+06, - "cpu_time": 4.0086557477876195e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7714635045254970e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4626405543010410e+03, - "cpu_time": 1.9760975412514558e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3847871772243700e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.9519891609361243e-04, - "cpu_time": 4.9293213179081856e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.9517672995665272e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 192, - "real_time": 3.6501529599869777e+06, - "cpu_time": 5.1268900364582017e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1490762294013464e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 192, - "real_time": 3.6505579567650179e+06, - "cpu_time": 5.1304449114584951e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1489487496636894e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 192, - "real_time": 3.6481537972576916e+06, - "cpu_time": 5.1239622968749879e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1497059151269467e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 192, - "real_time": 3.6491854176953589e+06, - "cpu_time": 5.1267491614582399e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1493808946131628e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 192, - "real_time": 3.6489745786335939e+06, - "cpu_time": 5.1244223854164751e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1494473062540796e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6494049420677284e+06, - "cpu_time": 5.1264937583332798e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1493118190118451e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time_median", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6491854176953593e+06, - "cpu_time": 5.1267491614582408e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1493808946131628e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6017454944186704e+02, - "cpu_time": 2.5754980591773465e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0239121786189493e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6310441419467103e-04, - "cpu_time": 5.0238977761180178e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6310633272864518e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 139, - "real_time": 4.9761741743724551e+06, - "cpu_time": 7.7605763525178023e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6857544985466442e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 139, - "real_time": 4.9780676469689226e+06, - "cpu_time": 7.7474725035968600e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6851132999584105e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 139, - "real_time": 5.4736043386858143e+06, - "cpu_time": 8.4399183381297905e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.5325565168661904e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 139, - "real_time": 4.9167989833588656e+06, - "cpu_time": 7.6660342374101048e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7061116446679301e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 139, - "real_time": 4.9057220638119914e+06, - "cpu_time": 7.6577349496403309e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7099639749019191e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0500734414396090e+06, - "cpu_time": 7.8543472762589771e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6638999869882190e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time_median", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9761741743724551e+06, - "cpu_time": 7.7474725035968600e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6857544985466442e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3907308424011533e+05, - "cpu_time": 3.3061566782678844e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4300818455964804e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.7340516333553254e-02, - "cpu_time": 4.2093334582509141e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4654618088227002e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 87, - "real_time": 7.8046692203430608e+06, - "cpu_time": 1.3326178494252674e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1496383160313544e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 87, - "real_time": 7.8886750143492362e+06, - "cpu_time": 1.3464145241379088e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1267470100470364e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 87, - "real_time": 7.7860281995401299e+06, - "cpu_time": 1.3282019367816301e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1547849005980892e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 87, - "real_time": 7.8222674542459948e+06, - "cpu_time": 1.3328153022988662e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1448021431296346e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 87, - "real_time": 7.8284045221048528e+06, - "cpu_time": 1.3337664999999786e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1431207281926517e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8260088821166549e+06, - "cpu_time": 1.3347632225287303e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1438186195997536e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time_median", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8222674542459948e+06, - "cpu_time": 1.3328153022988662e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1448021431296346e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8731826855888634e+04, - "cpu_time": 6.8591868070928584e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0571452231741862e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.9491161381627598e-03, - "cpu_time": 5.1388790845600463e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9311318294807654e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.3753764166989747e+07, - "cpu_time": 2.5208431078431647e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4396544533265743e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.3704549740342533e+07, - "cpu_time": 2.5118256156863660e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4484154996515293e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3688876074464882e+07, - "cpu_time": 2.5062077607842907e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4512189180083356e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.3667981980331972e+07, - "cpu_time": 2.5061052529411774e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4549660694815331e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.3663266675875468e+07, - "cpu_time": 2.4982486686274022e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4558132982389450e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3695687727600923e+07, - "cpu_time": 2.5086460811764803e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4500136477413836e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time_median", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3688876074464882e+07, - "cpu_time": 2.5062077607842907e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4512189180083356e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6457302859116266e+04, - "cpu_time": 8.3573964452823682e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5092643524625730e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6619548856713381e-03, - "cpu_time": 3.3314370281211599e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6568277929648791e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 28, - "real_time": 2.5347997301391192e+07, - "cpu_time": 4.8319042428571738e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6475016231880698e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 28, - "real_time": 2.5383615068026952e+07, - "cpu_time": 4.8318439535715841e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6437867033577075e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 28, - "real_time": 2.5252980113561664e+07, - "cpu_time": 4.8165034499999948e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6574631468529282e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 28, - "real_time": 2.5414757962737765e+07, - "cpu_time": 4.8324208928570606e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6405470435088420e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 28, - "real_time": 2.5381243455090694e+07, - "cpu_time": 4.8313005749999352e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6440337376985378e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5356118780161656e+07, - "cpu_time": 4.8287946228571497e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6466664509212170e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time_median", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5381243455090694e+07, - "cpu_time": 4.8318439535715848e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6440337376985378e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.2308490260676830e+04, - "cpu_time": 6.8824180854553633e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5180025272041736e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4573354779133744e-03, - "cpu_time": 1.4252869759416491e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4627215586367044e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 4.5931733896334969e+07, - "cpu_time": 8.8094783133332536e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9221132453419018e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 4.6064277986685432e+07, - "cpu_time": 8.8262258800000384e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9137052368170128e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 4.5985420296589531e+07, - "cpu_time": 8.8215292533334389e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9187017783972311e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.5873675495386124e+07, - "cpu_time": 8.8072767800000906e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9258115150049253e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 4.5939083149035774e+07, - "cpu_time": 8.8197541933334380e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9216457708694420e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5958838164806373e+07, - "cpu_time": 8.8168528840000525e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9203955092861023e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time_median", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5939083149035767e+07, - "cpu_time": 8.8197541933334380e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9216457708694420e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1066426755604698e+04, - "cpu_time": 8.1275017723240220e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5131851053551966e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5463059901724150e-03, - "cpu_time": 9.2181437971739378e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5454020152422627e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.7765168398618698e+07, - "cpu_time": 1.6801173762500098e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0585648144694362e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.7353305891156197e+07, - "cpu_time": 1.6684306724999943e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0729856559118147e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.7321687489748001e+07, - "cpu_time": 1.6697040237500006e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0740983565109830e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.7479706853628159e+07, - "cpu_time": 1.6699873424999368e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0685454450498862e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.7955432012677193e+07, - "cpu_time": 1.6804949849999672e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0519485818830366e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7575060129165664e+07, - "cpu_time": 1.6737468799999818e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0652285707650318e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time_median", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7479706853628159e+07, - "cpu_time": 1.6699873424999368e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0685454450498862e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7535831543197215e+05, - "cpu_time": 6.0179110705938865e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6256282502245009e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1442549400005253e-03, - "cpu_time": 3.5954726144696099e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1402644298797262e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.6883483529090881e+08, - "cpu_time": 3.1379676200000972e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1798586534286666e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6941775754094124e+08, - "cpu_time": 3.1604303200001025e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1689175904141016e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.6910199820995331e+08, - "cpu_time": 3.1363901099999225e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1748348197129693e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.6954611614346504e+08, - "cpu_time": 3.1578085249999785e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1665184919111643e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.6830755025148392e+08, - "cpu_time": 3.1287779000000173e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1898207252010465e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6904165148735049e+08, - "cpu_time": 3.1442748950000238e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1759900561335893e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time_median", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6910199820995331e+08, - "cpu_time": 3.1379676200000972e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1748348197129693e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9529275265536987e+05, - "cpu_time": 1.4020211342597788e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3182391477875262e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9300042226127502e-03, - "cpu_time": 4.4589648840476729e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9339635776855781e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.2825644314289093e+08, - "cpu_time": 5.6972759350000501e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2710456913486910e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.3334909379482269e+08, - "cpu_time": 5.7673104549999726e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2210731752008033e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.2752867043018341e+08, - "cpu_time": 5.7053947200000715e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2783139948930998e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.2927018404006958e+08, - "cpu_time": 5.7399297800000679e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2609749562667179e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.2902532815933228e+08, - "cpu_time": 5.7473825599998915e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2634017265687060e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2948594391345984e+08, - "cpu_time": 5.7314586900000107e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2589619088556037e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time_median", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2902532815933228e+08, - "cpu_time": 5.7399297800000679e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2634017265687060e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2652393822090030e+06, - "cpu_time": 2.9404376063471017e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2247705008155786e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.8750713772602490e-03, - "cpu_time": 5.1303477271456982e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8266232102013576e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2600090174866435e+06, - "cpu_time": 2.5695969902912681e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8123821490567159e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2642627738199187e+06, - "cpu_time": 2.5744609449838824e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8089773180741975e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2596957608092949e+06, - "cpu_time": 2.5764080258898009e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8126333956271373e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2572683159888852e+06, - "cpu_time": 2.5664961941747107e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8145826842944836e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2635994671955463e+06, - "cpu_time": 2.5744267346278355e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8095074059522904e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2609670670600580e+06, - "cpu_time": 2.5722777779934993e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8116165906009648e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time_median", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2600090174866435e+06, - "cpu_time": 2.5744267346278355e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8123821490567159e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9157353948604691e+03, - "cpu_time": 4.0944021103834166e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3362418199031649e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2895965789770695e-03, - "cpu_time": 1.5917418194147165e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2895895478237849e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 310, - "real_time": 2.2590366560184667e+06, - "cpu_time": 2.5710351548388000e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6263245123425010e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 310, - "real_time": 2.2739739938368718e+06, - "cpu_time": 2.5854786483870568e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6025038202735353e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 310, - "real_time": 2.2588389640253396e+06, - "cpu_time": 2.5709762419353412e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6266418857064224e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 310, - "real_time": 2.2646800291934800e+06, - "cpu_time": 2.5760841161290077e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6172880470524635e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 310, - "real_time": 2.2585592307751216e+06, - "cpu_time": 2.5768473193548494e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6270910624684230e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2630177747698561e+06, - "cpu_time": 2.5760842961290111e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6199698655686695e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time_median", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2590366560184667e+06, - "cpu_time": 2.5760841161290077e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6263245123425010e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6331027113118671e+03, - "cpu_time": 5.9249916505637511e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0581395494122093e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9310873229824448e-03, - "cpu_time": 2.2999991341382045e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9230617621342648e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2749476041343412e+06, - "cpu_time": 2.5892622783172205e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2019241103508445e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2678811835504849e+06, - "cpu_time": 2.5883969223300456e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2243643621355863e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2675844977841889e+06, - "cpu_time": 2.5881509676375580e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2253095820728708e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2736204980984088e+06, - "cpu_time": 2.5885821326861572e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2061278536603218e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2675441073187445e+06, - "cpu_time": 2.5884359352750722e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2254382823773371e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2703155781772337e+06, - "cpu_time": 2.5885656472492106e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2166328381193923e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time_median", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2678811835504849e+06, - "cpu_time": 2.5884359352750718e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2243643621355863e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6552800228560532e+03, - "cpu_time": 4.1917153179785464e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1611412154710662e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6100316881016007e-03, - "cpu_time": 1.6193196886596072e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6089792033449940e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 307, - "real_time": 2.2812229277814832e+06, - "cpu_time": 2.6062090553745935e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4364225258715628e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 307, - "real_time": 2.2826056164486110e+06, - "cpu_time": 2.6085501954397950e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4355524127283122e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 307, - "real_time": 2.2814944902198324e+06, - "cpu_time": 2.6066741335504455e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4362515509227751e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 307, - "real_time": 2.2876287032379876e+06, - "cpu_time": 2.6058994723127107e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4324002821620073e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 307, - "real_time": 2.2869376042487663e+06, - "cpu_time": 2.6062817557002665e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4328331450373752e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2839778683873364e+06, - "cpu_time": 2.6067229224755624e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4346919833444066e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time_median", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2826056164486110e+06, - "cpu_time": 2.6062817557002660e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4355524127283122e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0711794036791334e+03, - "cpu_time": 1.0580718948257218e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9283763476773020e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3446625057919766e-03, - "cpu_time": 4.0590117411515607e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3441047765403058e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 302, - "real_time": 2.3126381253576931e+06, - "cpu_time": 2.6482020728477114e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8338199254526094e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 302, - "real_time": 2.3138959003945454e+06, - "cpu_time": 2.6492488278147192e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8322795329221755e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 302, - "real_time": 2.3213322073936658e+06, - "cpu_time": 2.6510891721854843e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8232064239345644e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 302, - "real_time": 2.3149258359982972e+06, - "cpu_time": 2.6512511986754518e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8310194210493147e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 302, - "real_time": 2.3139907333950531e+06, - "cpu_time": 2.6435309172185366e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8321634591788769e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3153565605078512e+06, - "cpu_time": 2.6486644377483809e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8304977525075078e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time_median", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3139907333950531e+06, - "cpu_time": 2.6492488278147196e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8321634591788769e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4381237848615333e+03, - "cpu_time": 3.1416156374866878e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1958838068174031e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4849219526289347e-03, - "cpu_time": 1.1861131190168289e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4823837267139020e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 292, - "real_time": 2.4003613666848163e+06, - "cpu_time": 2.7534462226027427e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4605111471622281e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 292, - "real_time": 2.3937482029607850e+06, - "cpu_time": 2.7530366061644643e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4755967999424227e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 292, - "real_time": 2.3993777927674660e+06, - "cpu_time": 2.7528733356164545e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4627495676210403e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 292, - "real_time": 2.3908802580841091e+06, - "cpu_time": 2.7434804589042696e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4821649706971236e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 292, - "real_time": 2.3903980610369104e+06, - "cpu_time": 2.7390575890411139e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4832708466615550e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3949531363068176e+06, - "cpu_time": 2.7483788424658091e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4728586664168745e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time_median", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3937482029607850e+06, - "cpu_time": 2.7528733356164540e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4755967999424227e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6801563198453850e+03, - "cpu_time": 6.6793244369458234e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0690805421014826e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9541744883837301e-03, - "cpu_time": 2.4302779273883590e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9534225297314655e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 280, - "real_time": 2.5002882824212844e+06, - "cpu_time": 2.8842706214285432e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0484550995301197e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 280, - "real_time": 2.5001825531944633e+06, - "cpu_time": 2.8864867035713769e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0484994372313362e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 280, - "real_time": 2.4987842979109180e+06, - "cpu_time": 2.8812036142856609e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0490861504899110e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 280, - "real_time": 2.5052751747093028e+06, - "cpu_time": 2.8877715107142874e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0463680902055703e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 280, - "real_time": 2.4924419928408628e+06, - "cpu_time": 2.8756700857144324e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0517556707556939e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4993944602153664e+06, - "cpu_time": 2.8830805071428604e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0488328896425264e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time_median", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5001825531944633e+06, - "cpu_time": 2.8842706214285432e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0484994372313362e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6019537228431200e+03, - "cpu_time": 4.8337649190566208e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9323523640889101e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8412274637299875e-03, - "cpu_time": 1.6765972740202439e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8423834560980573e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 270, - "real_time": 2.5955991534930137e+06, - "cpu_time": 3.0532788481482216e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0199112767256156e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 270, - "real_time": 2.5944453595137154e+06, - "cpu_time": 3.0408749444444748e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0208095656262687e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 270, - "real_time": 2.5928127484534075e+06, - "cpu_time": 3.0428158814814836e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0220820046211734e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 270, - "real_time": 2.5968429899808983e+06, - "cpu_time": 3.0432826074074991e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0189437791302758e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 270, - "real_time": 2.5964791412223820e+06, - "cpu_time": 3.0485874925924842e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0192266969384292e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5952358785326835e+06, - "cpu_time": 3.0457679548148327e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0201946646083528e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time_median", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5955991534930137e+06, - "cpu_time": 3.0432826074074991e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0199112767256156e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6398900670014166e+03, - "cpu_time": 5.0792851643108897e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2769240545153811e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.3188478572074594e-04, - "cpu_time": 1.6676533602244447e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3207970839925637e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 255, - "real_time": 2.7522569412694257e+06, - "cpu_time": 3.3423609529412109e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8098768478947479e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 255, - "real_time": 2.7481577843062435e+06, - "cpu_time": 3.3383941098040226e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8155596668722826e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 255, - "real_time": 2.7521641021046569e+06, - "cpu_time": 3.3405116078432575e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8100053670423383e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 255, - "real_time": 2.7458048754316918e+06, - "cpu_time": 3.3324751843137541e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8188292597999859e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 255, - "real_time": 2.7543394662001552e+06, - "cpu_time": 3.3411313921568957e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8069962430832803e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7505446338624349e+06, - "cpu_time": 3.3389746494118283e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8122534769385272e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time_median", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7521641021046569e+06, - "cpu_time": 3.3405116078432570e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8100053670423383e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4683492938808704e+03, - "cpu_time": 3.9070738690708117e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8091756994312443e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2609681919651173e-03, - "cpu_time": 1.1701418187643488e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2615047054251247e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 227, - "real_time": 3.0904596298112483e+06, - "cpu_time": 3.9963960176211339e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7858902920795798e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 227, - "real_time": 3.0867147581479494e+06, - "cpu_time": 4.0084552995595629e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7941230865734613e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 227, - "real_time": 3.0834844596437817e+06, - "cpu_time": 3.9928599603524264e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8012406984605742e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 227, - "real_time": 3.0904434393631862e+06, - "cpu_time": 4.0049709691629689e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7859258425131941e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 227, - "real_time": 3.0873667783132601e+06, - "cpu_time": 3.9950293524229247e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7926882375334418e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0876938130558850e+06, - "cpu_time": 3.9995423198238038e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7919736314320505e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time_median", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0873667783132605e+06, - "cpu_time": 3.9963960176211335e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7926882375334418e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9152334184201272e+03, - "cpu_time": 6.7792230718115261e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4146730061632919e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.4414588846001093e-04, - "cpu_time": 1.6949997098943505e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4444904445407766e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 194, - "real_time": 3.6075955482449420e+06, - "cpu_time": 5.0669181649483955e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1626314380059831e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 194, - "real_time": 3.6124401106547141e+06, - "cpu_time": 5.0700931030927766e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1610722590608788e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 194, - "real_time": 3.6106504219075302e+06, - "cpu_time": 5.0731493556700516e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1616477669926634e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 194, - "real_time": 3.6086875383655741e+06, - "cpu_time": 5.0660978195876908e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1622796253231888e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 194, - "real_time": 3.6091799223699518e+06, - "cpu_time": 5.0696896546393177e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1621210607992711e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6097107083085426e+06, - "cpu_time": 5.0691896195876468e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1619504300363972e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time_median", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6091799223699518e+06, - "cpu_time": 5.0696896546393177e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1621210607992711e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8798411742405108e+03, - "cpu_time": 2.8046640062416468e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0498872452302778e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.2077336001293481e-04, - "cpu_time": 5.5327660172826444e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2066655244843534e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 144, - "real_time": 4.8555973141143722e+06, - "cpu_time": 7.5064272569444291e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7276160804389162e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 144, - "real_time": 4.9242753205665695e+06, - "cpu_time": 7.5905172777777826e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7035213211910410e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 144, - "real_time": 4.9131074790946310e+06, - "cpu_time": 7.5814197152779019e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7073935458757398e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 144, - "real_time": 4.9007253805434126e+06, - "cpu_time": 7.5675086180552058e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7117074205594106e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 144, - "real_time": 4.9668165997395087e+06, - "cpu_time": 7.6667158958332799e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6889304913009980e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9121044188116994e+06, - "cpu_time": 7.5825177527777208e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7078337718732212e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time_median", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9131074790946310e+06, - "cpu_time": 7.5814197152779009e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7073935458757398e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0202907589317365e+04, - "cpu_time": 5.7379358357178207e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3986332011457471e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.1844570395030319e-03, - "cpu_time": 7.5673226529747728e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1895160066525075e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 88, - "real_time": 7.7881932533769449e+06, - "cpu_time": 1.3280076875000061e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1541858880717211e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 88, - "real_time": 7.8388116460039532e+06, - "cpu_time": 1.3361974874999695e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1402754342940030e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 88, - "real_time": 7.8538388955745511e+06, - "cpu_time": 1.3367049965909479e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1361803091547444e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 88, - "real_time": 7.8764535402032463e+06, - "cpu_time": 1.3434162499999564e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1300469702976341e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 88, - "real_time": 7.8353079416873781e+06, - "cpu_time": 1.3359490556817895e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1412324984366767e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8385210553692151e+06, - "cpu_time": 1.3360550954545338e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1403842200509560e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time_median", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8388116460039522e+06, - "cpu_time": 1.3361974874999691e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1402754342940030e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2468468665874021e+04, - "cpu_time": 5.4635442352572492e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8846644562324360e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1421676916506885e-03, - "cpu_time": 4.0893105784672139e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1509670894606570e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.3773931372983783e+07, - "cpu_time": 2.5227722941176400e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4360824147718444e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.3744334617227901e+07, - "cpu_time": 2.5128194784313153e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4413282224620056e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3749285126287563e+07, - "cpu_time": 2.5107510098038405e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4404492082171268e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.3759120604863353e+07, - "cpu_time": 2.5142871568627745e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4387046936807661e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.3724161951127006e+07, - "cpu_time": 2.5081296607842941e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4449166455110626e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3750166734497920e+07, - "cpu_time": 2.5137519199999735e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4402962369285617e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time_median", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3749285126287565e+07, - "cpu_time": 2.5128194784313150e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4404492082171268e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8411745027963934e+04, - "cpu_time": 5.5483857042766023e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2682517073199856e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3390197648855075e-03, - "cpu_time": 2.2072129155356994e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3392848203681682e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 28, - "real_time": 2.5335913257939477e+07, - "cpu_time": 4.8311474321427085e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6487643574075704e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 28, - "real_time": 2.5241970284176726e+07, - "cpu_time": 4.8184712535714880e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6586222566812906e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 28, - "real_time": 2.3822576273232698e+07, - "cpu_time": 4.5662603714285009e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.8170279834681120e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 28, - "real_time": 2.5323221792599984e+07, - "cpu_time": 4.8283674642858289e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6500918623084021e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 28, - "real_time": 2.5380736549517937e+07, - "cpu_time": 4.8343909107143998e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6440865444968581e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5020883631493367e+07, - "cpu_time": 4.7757274864285856e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6837186008724470e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time_median", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5323221792599987e+07, - "cpu_time": 4.8283674642858282e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6500918623084021e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7174511249928526e+05, - "cpu_time": 1.1724678769235932e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4706884814935222e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6847377670298222e-02, - "cpu_time": 2.4550560731437278e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7837078295261226e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 4.5796250055233635e+07, - "cpu_time": 8.7948593466664240e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9307580388814273e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 4.5884175101915993e+07, - "cpu_time": 8.8015200466664582e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9251420059722385e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 4.5773166914780937e+07, - "cpu_time": 8.8000605066667959e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9322360030251436e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.5799620449542999e+07, - "cpu_time": 8.7905371066669136e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9305423643819575e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 4.7474804272254311e+07, - "cpu_time": 9.0887123600001976e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.8271359947120590e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6145603358745582e+07, - "cpu_time": 8.8551378733333588e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9091628813945656e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time_median", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5799620449542999e+07, - "cpu_time": 8.8000605066667959e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9305423643819575e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4424132693422516e+05, - "cpu_time": 1.3064473612436741e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5933497097859204e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6128109132051809e-02, - "cpu_time": 1.4753551891924245e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5789248993799913e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.7127114646136761e+07, - "cpu_time": 1.6654042049999872e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0809634531137605e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.7224393151700497e+07, - "cpu_time": 1.6653333850000250e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0775273556003718e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.7373133748769760e+07, - "cpu_time": 1.6694419062500286e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0722882936973705e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.7373673915863037e+07, - "cpu_time": 1.6675033312499467e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0722693000009522e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.7373673915863037e+07, - "cpu_time": 1.6680968074999213e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0722693000009522e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7294397875666618e+07, - "cpu_time": 1.6671559269999820e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0750635404826813e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time_median", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7373133748769760e+07, - "cpu_time": 1.6675033312499467e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0722882936973705e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1363654679452784e+05, - "cpu_time": 1.7763611867846493e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0061486633623568e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3017621927627055e-03, - "cpu_time": 1.0655039267869685e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3027856532465429e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.6953257098793983e+08, - "cpu_time": 3.1529438974999380e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1667714874576626e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6811056435108185e+08, - "cpu_time": 3.1126445499998569e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1935584421619072e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.6956792771816254e+08, - "cpu_time": 3.1567451300000471e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1661111816636028e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.6776176542043686e+08, - "cpu_time": 3.1102028449998897e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2001982731554995e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.6972156986594200e+08, - "cpu_time": 3.1606482800000888e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1632450278656878e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6893887966871262e+08, - "cpu_time": 3.1386369404999644e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1779768824608722e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time_median", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6953257098793983e+08, - "cpu_time": 3.1529438974999380e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1667714874576626e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2634753127348702e+05, - "cpu_time": 2.5005983098930260e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7463952012100812e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.4833294330472945e-03, - "cpu_time": 7.9671473868994144e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4953049244894350e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.2118438184261322e+08, - "cpu_time": 5.6285165600002074e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3430698524007154e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.1957006454467773e+08, - "cpu_time": 5.5946652399995852e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3599574651332359e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.1947125494480133e+08, - "cpu_time": 5.5901376399998522e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3609966699054742e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.2023563981056213e+08, - "cpu_time": 5.5963666299999201e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3529741556410780e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.1954620778560638e+08, - "cpu_time": 5.5891955750001895e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3602083136608748e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2000150978565216e+08, - "cpu_time": 5.5997763289999509e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3554412913482757e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time_median", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1957006454467773e+08, - "cpu_time": 5.5946652399995852e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3599574651332359e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2948925199684722e+05, - "cpu_time": 1.6344776205440599e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.6341636498676138e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2796431569509900e-03, - "cpu_time": 2.9188266182695135e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2751593566997181e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 310, - "real_time": 2.2559926439557346e+06, - "cpu_time": 2.5732202290320797e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8156087569585040e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 310, - "real_time": 2.2582016750088623e+06, - "cpu_time": 2.5771280193544775e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8138326816996650e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 310, - "real_time": 2.2586285339428051e+06, - "cpu_time": 2.5711353516128603e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8134898848770687e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 310, - "real_time": 2.2546584432524056e+06, - "cpu_time": 2.5751302612900049e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8166831487306827e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 310, - "real_time": 2.2569128988130437e+06, - "cpu_time": 2.5703424064515950e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8148684435957493e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2568788389945705e+06, - "cpu_time": 2.5733912535482035e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8148965831723341e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time_median", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2569128988130437e+06, - "cpu_time": 2.5732202290320797e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8148684435957493e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6223429431576446e+03, - "cpu_time": 2.8018466304414578e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3048454187268549e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.1884361496357121e-04, - "cpu_time": 1.0887759980447041e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1896406154782694e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 310, - "real_time": 2.2633655800393992e+06, - "cpu_time": 2.5811816870967252e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6193887864360819e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 310, - "real_time": 2.2609800310625182e+06, - "cpu_time": 2.5786435290320520e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6232075858495198e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 310, - "real_time": 2.2633475289049167e+06, - "cpu_time": 2.5858345451612673e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6194176525615416e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 310, - "real_time": 2.2577031027345406e+06, - "cpu_time": 2.5748671903226837e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6284664666836886e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 310, - "real_time": 2.2649728129768083e+06, - "cpu_time": 2.5887546677418253e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6168204550029095e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2620738111436367e+06, - "cpu_time": 2.5818563238709113e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6214601893067481e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time_median", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2633475289049167e+06, - "cpu_time": 2.5811816870967252e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6194176525615416e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8281921038583009e+03, - "cpu_time": 5.5461375298219700e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5313110130590585e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2502651725712045e-03, - "cpu_time": 2.1481201252542157e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2512386651215631e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 307, - "real_time": 2.2700542207892244e+06, - "cpu_time": 2.5945861986970408e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2174487507632365e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 307, - "real_time": 2.2702178870804049e+06, - "cpu_time": 2.5907261563515370e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2169284249057295e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 307, - "real_time": 2.2657341816756837e+06, - "cpu_time": 2.5860251856676699e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2312101448205980e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 307, - "real_time": 2.2687836396978130e+06, - "cpu_time": 2.5957727915307316e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2214907201033235e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 307, - "real_time": 2.2659864843935259e+06, - "cpu_time": 2.5844610423453869e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2304049970470378e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2681552827273305e+06, - "cpu_time": 2.5903142749184733e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2234966075279852e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time_median", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2687836396978130e+06, - "cpu_time": 2.5907261563515370e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2214907201033235e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1691329761038824e+03, - "cpu_time": 5.0217278112732456e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9095166630943240e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.5634236007669654e-04, - "cpu_time": 1.9386558070955686e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5653352365301231e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 307, - "real_time": 2.2887587463877588e+06, - "cpu_time": 2.6195855863192063e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4316930542249685e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 307, - "real_time": 2.2855425543221571e+06, - "cpu_time": 2.6127218273615432e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4337077180222658e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 307, - "real_time": 2.2881484601088474e+06, - "cpu_time": 2.6192443583060759e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4320749099663412e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 307, - "real_time": 2.2874672552843727e+06, - "cpu_time": 2.6125479771985961e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4325013800438581e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 307, - "real_time": 2.2900721197796180e+06, - "cpu_time": 2.6197216026057298e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4308719676109321e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2879978271765509e+06, - "cpu_time": 2.6167642703582305e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4321698059736732e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time_median", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2881484601088474e+06, - "cpu_time": 2.6192443583060764e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4320749099663412e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6743841739782893e+03, - "cpu_time": 3.7740875516004171e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0483077708487499e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.3181195982363449e-04, - "cpu_time": 1.4422726549547969e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3197170229129965e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 299, - "real_time": 2.3264314015286923e+06, - "cpu_time": 2.6595381137123094e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8170183722991556e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 299, - "real_time": 2.3293242280536573e+06, - "cpu_time": 2.6691475518396068e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8135198702999257e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 299, - "real_time": 2.3304640422933376e+06, - "cpu_time": 2.6696958729099152e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8121437967138961e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 299, - "real_time": 2.3275904667355046e+06, - "cpu_time": 2.6620422474915446e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8156155877333369e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 299, - "real_time": 2.3313898392283297e+06, - "cpu_time": 2.6651747458192348e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8110270919638157e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3290399955679043e+06, - "cpu_time": 2.6651197063545221e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8138649438020259e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time_median", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3293242280536569e+06, - "cpu_time": 2.6651747458192348e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8135198702999257e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0332461182366685e+03, - "cpu_time": 4.4100112927378641e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4568115280531798e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7299751060775132e-04, - "cpu_time": 1.6547141511966410e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7310925617261356e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 293, - "real_time": 2.4084046192200212e+06, - "cpu_time": 2.7685551501706019e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4422748965848021e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 293, - "real_time": 2.3911704083605837e+06, - "cpu_time": 2.7489539419794232e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4814997518250734e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 293, - "real_time": 2.3981962216312364e+06, - "cpu_time": 2.7597395665525440e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4654410184520155e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 293, - "real_time": 2.3930242997133285e+06, - "cpu_time": 2.7512339215016090e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4772531986282684e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 293, - "real_time": 2.3916596594447773e+06, - "cpu_time": 2.7502250819113334e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4803784260185376e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3964910416739900e+06, - "cpu_time": 2.7557415324231023e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4693694583017401e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time_median", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3930242997133285e+06, - "cpu_time": 2.7512339215016090e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4772531986282684e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.2199491264005237e+03, - "cpu_time": 8.3215720146485801e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6432001300435074e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0127169268937743e-03, - "cpu_time": 3.0197215220440082e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0043684972668261e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 279, - "real_time": 2.5143706420015902e+06, - "cpu_time": 2.9003723010753114e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0425829653790325e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 279, - "real_time": 2.5120423188746832e+06, - "cpu_time": 2.8979715197132835e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0435492986337602e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 279, - "real_time": 2.5098590801159539e+06, - "cpu_time": 2.8984415053765168e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0444570457234161e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 279, - "real_time": 2.5133619395395122e+06, - "cpu_time": 2.9055868100358141e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0430013913874616e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 279, - "real_time": 2.5156655650933050e+06, - "cpu_time": 2.9023860000000740e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0420463023282556e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5130599091250091e+06, - "cpu_time": 2.9009516272402001e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0431274006903853e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time_median", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5133619395395117e+06, - "cpu_time": 2.9003723010753114e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0430013913874616e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2293206549346951e+03, - "cpu_time": 3.1248886460929634e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2561001628655678e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.8709411456525697e-04, - "cpu_time": 1.0771943305603493e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8734129280272904e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 269, - "real_time": 2.6113682514797468e+06, - "cpu_time": 3.0662008921932848e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0077137711347651e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 269, - "real_time": 2.6169171241773325e+06, - "cpu_time": 3.0781235018586484e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0034566442940673e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 269, - "real_time": 2.6102541810850226e+06, - "cpu_time": 3.0650024052047366e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0085706740715399e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 269, - "real_time": 2.6247869107221360e+06, - "cpu_time": 3.0832816505574398e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.9974497657631069e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 269, - "real_time": 2.6048367521050475e+06, - "cpu_time": 3.0595005947956704e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0127480141560006e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6136326439138572e+06, - "cpu_time": 3.0704218089219560e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0059877738838959e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time_median", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6113682514797468e+06, - "cpu_time": 3.0662008921932848e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0077137711347651e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5682672310175667e+03, - "cpu_time": 9.8887637452822892e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8020575682252587e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8956889747459892e-03, - "cpu_time": 3.2206531742797560e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8923693572626306e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 251, - "real_time": 2.7875217249193988e+06, - "cpu_time": 3.3769406135455850e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7616783059522867e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 251, - "real_time": 2.7885283473359635e+06, - "cpu_time": 3.3833714023903194e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7603203890746278e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 251, - "real_time": 2.7828466933799456e+06, - "cpu_time": 3.3715908844621670e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7679977215217608e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 251, - "real_time": 2.7898236111073620e+06, - "cpu_time": 3.3839872629483305e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7585745415058333e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 251, - "real_time": 2.7826611960002505e+06, - "cpu_time": 3.3736036215141686e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7682489032700247e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7862763145485842e+06, - "cpu_time": 3.3778987569721141e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7633639722649074e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time_median", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7875217249193988e+06, - "cpu_time": 3.3769406135455845e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7616783059522867e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3180338687287731e+03, - "cpu_time": 5.6163875382649358e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4826805494034482e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1908488226395958e-03, - "cpu_time": 1.6626867595343090e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1911365954607985e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 225, - "real_time": 3.1122992549919421e+06, - "cpu_time": 3.9910988488888205e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7382723452325273e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 225, - "real_time": 3.1095152379324040e+06, - "cpu_time": 3.9789510799998119e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7443052679634070e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 225, - "real_time": 3.1001683552232054e+06, - "cpu_time": 3.9696649955552248e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7646390766704333e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 225, - "real_time": 3.1001043257613978e+06, - "cpu_time": 3.9717578888889370e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7647787933231294e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 225, - "real_time": 3.1016538664698601e+06, - "cpu_time": 3.9734093866667938e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7613992092124343e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1047482080757627e+06, - "cpu_time": 3.9769764399999180e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7546789384803867e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time_median", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1016538664698601e+06, - "cpu_time": 3.9734093866667943e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7613992092124343e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.7414834373248732e+03, - "cpu_time": 8.6133036779760005e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2481614492043888e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8492589583885409e-03, - "cpu_time": 2.1657919798931924e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8478471894404949e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 186, - "real_time": 3.7539507793162460e+06, - "cpu_time": 5.2270775698923320e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1173039409866641e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 186, - "real_time": 3.7674458637352912e+06, - "cpu_time": 5.2394027043014923e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1133017305898309e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 186, - "real_time": 3.7792885152783287e+06, - "cpu_time": 5.2507099247315964e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1098131256832895e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 186, - "real_time": 3.7868360422992259e+06, - "cpu_time": 5.2614518924729638e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1076011618008618e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 186, - "real_time": 3.7634664988746084e+06, - "cpu_time": 5.2366837903230013e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1144788989763095e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7701975399007401e+06, - "cpu_time": 5.2430651763442773e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1124997716073911e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time_median", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7674458637352912e+06, - "cpu_time": 5.2394027043014932e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1133017305898309e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3003090592915854e+04, - "cpu_time": 1.3287709142307538e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8358366471996694e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.4489149322552981e-03, - "cpu_time": 2.5343398747471571e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4479437615141935e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 133, - "real_time": 5.2696417954127146e+06, - "cpu_time": 8.1056103233079817e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.5918744244252775e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 133, - "real_time": 5.3372561294389395e+06, - "cpu_time": 8.1926622481205408e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.5717079706425524e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 133, - "real_time": 5.3122442992950296e+06, - "cpu_time": 8.1690210451129088e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.5791080995866897e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 133, - "real_time": 5.3091754653680148e+06, - "cpu_time": 8.1622787669166978e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.5800208628852558e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 133, - "real_time": 5.3111230849491479e+06, - "cpu_time": 8.1703635563906888e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.5794414600881574e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3078881548927687e+06, - "cpu_time": 8.1599871879697638e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.5804305635255868e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time_median", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3111230849491470e+06, - "cpu_time": 8.1690210451129097e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.5794414600881574e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4271175688359835e+04, - "cpu_time": 3.2477045342639518e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2446647607960440e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5726614766716323e-03, - "cpu_time": 3.9800363155619032e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5839816870124417e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 83, - "real_time": 8.3905264555689804e+06, - "cpu_time": 1.3857575903613677e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.9995427091305561e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 83, - "real_time": 8.3908714937517438e+06, - "cpu_time": 1.3860120409639508e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.9994604866125219e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 83, - "real_time": 8.3818961473473581e+06, - "cpu_time": 1.3848909975903200e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0016015117664673e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 83, - "real_time": 8.3871489637587443e+06, - "cpu_time": 1.3862676807229122e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0003479218617816e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 83, - "real_time": 8.3903066409998629e+06, - "cpu_time": 1.3864104746988300e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.9995950944172738e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3881499402853381e+06, - "cpu_time": 1.3858677568674762e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0001095447577202e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time_median", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3903066409998629e+06, - "cpu_time": 1.3860120409639511e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.9995950944172738e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8019046619523251e+03, - "cpu_time": 6.0031137384729063e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0692164124581346e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5324710323704542e-04, - "cpu_time": 4.3316641928678299e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5343598485535544e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 48, - "real_time": 1.3940245689203342e+07, - "cpu_time": 2.4647182520835053e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4070186959464965e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 48, - "real_time": 1.4407394938947013e+07, - "cpu_time": 2.5163408291665707e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3289728741518335e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 48, - "real_time": 1.4397068201409033e+07, - "cpu_time": 2.5118535958334576e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3306434011833081e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 48, - "real_time": 1.4461928648718944e+07, - "cpu_time": 2.5236190312500164e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3201906754651494e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 48, - "real_time": 1.4420718265076479e+07, - "cpu_time": 2.5165305395833094e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3268211321526742e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4325471148670962e+07, - "cpu_time": 2.5066124495833725e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3427293557798920e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time_median", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4407394938947013e+07, - "cpu_time": 2.5163408291665711e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3289728741518335e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1675387107215193e+05, - "cpu_time": 2.3795099793433218e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6157620336742297e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5130662637386359e-02, - "cpu_time": 9.4929313055108436e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5433972450780797e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 27, - "real_time": 2.6525566837301962e+07, - "cpu_time": 4.8506776592594855e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5299690827201171e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 27, - "real_time": 2.6410722208243828e+07, - "cpu_time": 4.8265675703705542e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5409704237111955e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 27, - "real_time": 2.6494159466690488e+07, - "cpu_time": 4.8493755555556260e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5329682220857749e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 27, - "real_time": 2.6465045288205147e+07, - "cpu_time": 4.8365955703704655e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5357547387197881e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 27, - "real_time": 2.6505359551972814e+07, - "cpu_time": 4.8396105999998964e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5318978928925729e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6480170670482852e+07, - "cpu_time": 4.8405653911112063e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5343120720258899e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time_median", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6494159466690488e+07, - "cpu_time": 4.8396105999998964e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5329682220857749e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4561317942747613e+04, - "cpu_time": 9.9056429989066150e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2693876614990113e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6828183812432757e-03, - "cpu_time": 2.0463814035229185e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6846337547080888e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 14, - "real_time": 4.9681618277515687e+07, - "cpu_time": 9.0979318357142344e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.7015570879812236e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 14, - "real_time": 4.9551115504332952e+07, - "cpu_time": 9.0817518285713762e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.7086721788990493e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 14, - "real_time": 5.0608436710068159e+07, - "cpu_time": 9.2430238285714954e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.6520820781112652e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 14, - "real_time": 4.9380496942571230e+07, - "cpu_time": 9.0615186571426421e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.7180311319283233e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 14, - "real_time": 4.9348133217011176e+07, - "cpu_time": 9.0721041571433559e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.7198136839294410e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9713960130299844e+07, - "cpu_time": 9.1112660614286214e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.7000312321698608e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time_median", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9551115504332952e+07, - "cpu_time": 9.0817518285713762e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.7086721788990493e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1785126905741618e+05, - "cpu_time": 7.4862306435516675e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7800437767212227e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0416616735020357e-02, - "cpu_time": 8.2164548736466669e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0296339329701237e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7, - "real_time": 9.5367081463336945e+07, - "cpu_time": 1.7353544057142958e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.8147601025538116e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7, - "real_time": 9.6825783806187764e+07, - "cpu_time": 1.7482611685712916e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.7723551046828222e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7, - "real_time": 9.5486328005790710e+07, - "cpu_time": 1.7337804371428385e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.8112449353348355e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7, - "real_time": 9.5504111477306917e+07, - "cpu_time": 1.7347998928572193e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.8107214636909528e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7, - "real_time": 9.5386922359466553e+07, - "cpu_time": 1.7347605642856121e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.8141746201685629e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5714045422417790e+07, - "cpu_time": 1.7373912937142515e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.8046512452861972e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time_median", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5486328005790710e+07, - "cpu_time": 1.7347998928572193e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.8112449353348355e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.2435630939134571e+05, - "cpu_time": 6.1028164202717319e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8140070715240333e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.5231419969332049e-03, - "cpu_time": 3.5126320952287801e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4678525523373057e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.8729038536548615e+08, - "cpu_time": 3.3286879599998540e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8665161372396564e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8544181808829308e+08, - "cpu_time": 3.2933091450001937e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8950908567148728e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.8770507350564003e+08, - "cpu_time": 3.3337344999998206e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8601832756740508e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8626366183161736e+08, - "cpu_time": 3.2958761849999976e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8823169625288057e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8710634112358093e+08, - "cpu_time": 3.3286467524999350e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8693357412478333e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8676145598292351e+08, - "cpu_time": 3.3160509084999609e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8746885946810441e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time_median", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8710634112358093e+08, - "cpu_time": 3.3286467524999350e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8693357412478333e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0531338098920265e+05, - "cpu_time": 1.9718437060167626e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3966841734198894e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.8474315871256633e-03, - "cpu_time": 5.9463613811307258e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8585581617575386e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.6988337337970734e+08, - "cpu_time": 6.0993692649998367e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9029199506562843e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.6828731000423431e+08, - "cpu_time": 6.1107849849997818e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9155004661650028e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.6918786168098450e+08, - "cpu_time": 6.0871288399999917e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9083887512201610e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.6354982852935791e+08, - "cpu_time": 6.0807743700001991e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9534928632576475e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.6453041434288025e+08, - "cpu_time": 6.0529078849998546e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9455479755662575e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6708775758743292e+08, - "cpu_time": 6.0861930689999330e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9251700013730707e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time_median", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6828731000423431e+08, - "cpu_time": 6.0871288399999917e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9155004661650028e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8601476077597616e+06, - "cpu_time": 2.1889015017033070e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2845247658339798e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.7914546280626979e-03, - "cpu_time": 3.5965035563076237e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8098871681359615e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 311, - "real_time": 2.2505455196706331e+06, - "cpu_time": 2.5734133826366453e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8200031788734710e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 311, - "real_time": 2.2489820446795109e+06, - "cpu_time": 2.5692689228295111e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8212684310619726e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 311, - "real_time": 2.2501560995636741e+06, - "cpu_time": 2.5845736559486645e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8203181551689911e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 311, - "real_time": 2.2495511104727099e+06, - "cpu_time": 2.5701823987138388e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8208077073382370e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 311, - "real_time": 2.2483394747761670e+06, - "cpu_time": 2.5740397331188647e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8217889451092687e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2495148498325394e+06, - "cpu_time": 2.5742956186495051e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8208372835103886e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time_median", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2495511104727099e+06, - "cpu_time": 2.5734133826366449e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8208077073382370e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8602824740745166e+02, - "cpu_time": 6.0964768024783680e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1722512666820228e+02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.9387526046934533e-04, - "cpu_time": 2.3682116219723927e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9389852853049308e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 308, - "real_time": 2.2504143726818459e+06, - "cpu_time": 2.5721185259738364e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6402184857349163e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 308, - "real_time": 2.2502024219576996e+06, - "cpu_time": 2.5841188993505416e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6405613646406420e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 308, - "real_time": 2.2505052832209249e+06, - "cpu_time": 2.5723618116883659e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6400714368799892e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 308, - "real_time": 2.2571463638299759e+06, - "cpu_time": 2.5791607662335401e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6293614500477640e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 308, - "real_time": 2.2493645430893288e+06, - "cpu_time": 2.5768434610390081e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6419174584964872e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2515265969559550e+06, - "cpu_time": 2.5769206928570583e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6384260391599606e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time_median", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2504143726818454e+06, - "cpu_time": 2.5768434610390076e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6402184857349163e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1737131505228485e+03, - "cpu_time": 5.0170278674353031e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1194872308499744e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4095827936537288e-03, - "cpu_time": 1.9469081378181152e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4070609587083873e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 310, - "real_time": 2.2586399621720756e+06, - "cpu_time": 2.5909363774193511e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2539228360433020e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 310, - "real_time": 2.2654539409784540e+06, - "cpu_time": 2.5891805967742791e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2321046584260808e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 310, - "real_time": 2.2639674870597739e+06, - "cpu_time": 2.5874768193547893e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2368530438915379e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 310, - "real_time": 2.2579189487582734e+06, - "cpu_time": 2.5878537838711087e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2562392060221052e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 310, - "real_time": 2.2593357074525086e+06, - "cpu_time": 2.5903866967742182e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2516890455706622e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2610632092842171e+06, - "cpu_time": 2.5891668548387489e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2461617579907374e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time_median", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2593357074525086e+06, - "cpu_time": 2.5891805967742791e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2516890455706622e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4079362379007180e+03, - "cpu_time": 1.5165576689628656e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0915521125239366e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5072273185054233e-03, - "cpu_time": 5.8573191840790629e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5063866209172360e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 308, - "real_time": 2.2744202038406259e+06, - "cpu_time": 2.6079823961037043e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4407188234024379e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 308, - "real_time": 2.2805839030120475e+06, - "cpu_time": 2.6084475779219414e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4368250147132123e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 308, - "real_time": 2.2806779250151827e+06, - "cpu_time": 2.6092506753247543e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4367657809369054e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 308, - "real_time": 2.2747106222714018e+06, - "cpu_time": 2.6102576396103310e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4405348829505030e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 308, - "real_time": 2.2745371067461064e+06, - "cpu_time": 2.6086347792208367e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4406447757133780e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2769859521770729e+06, - "cpu_time": 2.6089146136363135e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4390978555432875e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time_median", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2747106222714018e+06, - "cpu_time": 2.6086347792208362e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4405348829505030e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3291496022954043e+03, - "cpu_time": 8.7779772997356088e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1029695663216338e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4620861402822169e-03, - "cpu_time": 3.3646088890202649e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4613110277533711e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 304, - "real_time": 2.3033263293511579e+06, - "cpu_time": 2.6465796250000633e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8452763798545800e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 304, - "real_time": 2.3045315718168002e+06, - "cpu_time": 2.6486118585526845e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8437883343179390e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 304, - "real_time": 2.3027568455099277e+06, - "cpu_time": 2.6397309177631796e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8459800316210791e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 304, - "real_time": 2.3189921906266948e+06, - "cpu_time": 2.6558297434208174e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8260552262700487e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 304, - "real_time": 2.3034889630875303e+06, - "cpu_time": 2.6411438453948223e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8450754941824172e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3066191800784222e+06, - "cpu_time": 2.6463791980263134e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8412350932492133e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time_median", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3034889630875303e+06, - "cpu_time": 2.6465796250000629e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8450754941824172e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9463704716123102e+03, - "cpu_time": 6.4410072946839673e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5226539051811793e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0114942820236761e-03, - "cpu_time": 2.4338943185042085e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9996299586158995e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 294, - "real_time": 2.3679862378583271e+06, - "cpu_time": 2.7235171156461686e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5351673039512753e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 294, - "real_time": 2.3672167571312208e+06, - "cpu_time": 2.7229394251699718e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5369665496472463e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 294, - "real_time": 2.3669522583522662e+06, - "cpu_time": 2.7238473945578714e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5375852866269752e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 294, - "real_time": 2.3742720514827338e+06, - "cpu_time": 2.7306174761906113e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5205131155103095e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 294, - "real_time": 2.3602458322103941e+06, - "cpu_time": 2.7167157789116893e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5533198369107910e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3673346274069892e+06, - "cpu_time": 2.7235274380952627e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5367104185293198e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time_median", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3672167571312212e+06, - "cpu_time": 2.7235171156461686e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5369665496472463e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9740216581272889e+03, - "cpu_time": 4.9273618427618449e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1634405915215440e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1011062823744022e-03, - "cpu_time": 1.8091838451269155e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1013210075570129e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 279, - "real_time": 2.4944601295095296e+06, - "cpu_time": 2.8834864910393623e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0509047504862054e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 279, - "real_time": 2.4926209560258309e+06, - "cpu_time": 2.8852307598564238e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0516801576520303e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 279, - "real_time": 2.4959075374789136e+06, - "cpu_time": 2.8852984157704483e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0502953176894867e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 279, - "real_time": 2.4892546171422605e+06, - "cpu_time": 2.8784833405016246e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0531023953706640e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 279, - "real_time": 2.4870375712071694e+06, - "cpu_time": 2.8837569964159187e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0540411734622866e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4918561622727411e+06, - "cpu_time": 2.8832512007167554e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0520047589321347e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time_median", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4926209560258305e+06, - "cpu_time": 2.8837569964159187e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0516801576520303e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6662669309968960e+03, - "cpu_time": 2.7907626971197787e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5483348978822379e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4712995824177160e-03, - "cpu_time": 9.6792214858907027e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4717945757716118e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 271, - "real_time": 2.5822777486650269e+06, - "cpu_time": 3.0388210479702214e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0303315562047648e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 271, - "real_time": 2.5861024473384847e+06, - "cpu_time": 3.0480577232471770e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0273288111210623e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 271, - "real_time": 2.5866703728275765e+06, - "cpu_time": 3.0417942804428516e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0268836938310122e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 271, - "real_time": 2.5826868793593780e+06, - "cpu_time": 3.0411069298891081e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0300099256710783e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 271, - "real_time": 2.5873936324404394e+06, - "cpu_time": 3.0437354059041617e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0263171147464314e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5850262161261817e+06, - "cpu_time": 3.0427030774907041e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0281742203148699e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time_median", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5861024473384852e+06, - "cpu_time": 3.0417942804428516e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0273288111210623e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3713263574394732e+03, - "cpu_time": 3.4706514361757922e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8609761349893769e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.1733164741093017e-04, - "cpu_time": 1.1406474269050316e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1756226676644381e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 255, - "real_time": 2.7423737196288272e+06, - "cpu_time": 3.3375854078432145e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8236072366603696e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 255, - "real_time": 2.7455792625379912e+06, - "cpu_time": 3.3438255882352749e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8191430650255746e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 255, - "real_time": 2.7458153299841224e+06, - "cpu_time": 3.3415150549016665e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8188147198015070e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 255, - "real_time": 2.7443983774705259e+06, - "cpu_time": 3.3415350196077377e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8207864011581945e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 255, - "real_time": 2.7457387990080845e+06, - "cpu_time": 3.3382368313725377e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8189211602312821e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7447810977259106e+06, - "cpu_time": 3.3405395803920864e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8202545165753859e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time_median", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7455792625379912e+06, - "cpu_time": 3.3415150549016660e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8191430650255746e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4633727539285996e+03, - "cpu_time": 2.5869908090773342e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0377568304388039e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.3314734466111864e-04, - "cpu_time": 7.7442303760211510e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3340865683093879e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 228, - "real_time": 3.0790301797535727e+06, - "cpu_time": 4.0094521491228435e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8110797152623022e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 228, - "real_time": 3.0774595940959426e+06, - "cpu_time": 4.0021049561404288e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8145557589882016e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 228, - "real_time": 3.0740448620921951e+06, - "cpu_time": 3.9993495175440731e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8221255514556098e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 228, - "real_time": 3.0741599314895114e+06, - "cpu_time": 3.9949298640351575e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8218701913269508e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 228, - "real_time": 3.0694729097089483e+06, - "cpu_time": 3.9910905570176663e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8322870463087249e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0748334954280341e+06, - "cpu_time": 3.9993854087720336e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8203836526683581e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time_median", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0741599314895114e+06, - "cpu_time": 3.9993495175440731e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8218701913269508e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6851073154679339e+03, - "cpu_time": 7.0248297469052386e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1771386305968906e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1984737778313250e-03, - "cpu_time": 1.7564773156138842e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1989264896260967e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 194, - "real_time": 3.6049507865586230e+06, - "cpu_time": 5.0685022783505172e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1634843991875930e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 194, - "real_time": 4.2438031745517682e+06, - "cpu_time": 6.0925368092784062e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 9.8833612858188307e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 194, - "real_time": 3.5952963415034041e+06, - "cpu_time": 5.0588905309275771e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1666087024821203e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 194, - "real_time": 3.5978720064956658e+06, - "cpu_time": 5.0580343144330522e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1657735440358982e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 194, - "real_time": 3.5939957447273214e+06, - "cpu_time": 5.0586034020619588e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1670308753574288e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7271836107673571e+06, - "cpu_time": 5.2673134670103025e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1302467299289846e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time_median", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5978720064956658e+06, - "cpu_time": 5.0588905309275771e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1657735440358982e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8883013496358949e+05, - "cpu_time": 4.6133426833480253e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.9342268614977226e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.7492864620137353e-02, - "cpu_time": 8.7584357988979414e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0199069383693274e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 142, - "real_time": 4.9312776971188653e+06, - "cpu_time": 7.6360314647887126e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7011023339653139e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 142, - "real_time": 4.9412812460476244e+06, - "cpu_time": 7.6862030915495008e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6976584780940740e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 142, - "real_time": 4.9420609040526859e+06, - "cpu_time": 7.6521822042248547e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6973906560157948e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 142, - "real_time": 4.9468192409619056e+06, - "cpu_time": 7.6462554366196878e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6957579388667617e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 142, - "real_time": 4.9359729893925320e+06, - "cpu_time": 7.6455287183100963e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6994841783022766e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9394824155147234e+06, - "cpu_time": 7.6532401830985714e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6982787170488443e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time_median", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9412812460476253e+06, - "cpu_time": 7.6462554366196888e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6976584780940740e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9863778217445670e+03, - "cpu_time": 1.9313635152976272e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0587387354397352e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2119443533074612e-03, - "cpu_time": 2.5235893152325915e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2122502123899158e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 87, - "real_time": 7.8450304070680309e+06, - "cpu_time": 1.3360336988505712e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1385788364675374e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 87, - "real_time": 7.8494700806579366e+06, - "cpu_time": 1.3387048390805129e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1373692526507146e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 87, - "real_time": 7.8724477086858507e+06, - "cpu_time": 1.3426099241378691e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1311308275175097e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 87, - "real_time": 7.8347278277164903e+06, - "cpu_time": 1.3354363356322063e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1413910436873322e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 87, - "real_time": 7.8145016049002782e+06, - "cpu_time": 1.3317404954023005e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1469335919618251e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8432355258057173e+06, - "cpu_time": 1.3369050586206917e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1390807104569836e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time_median", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8450304070680309e+06, - "cpu_time": 1.3360336988505710e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1385788364675374e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1174643083788731e+04, - "cpu_time": 4.0427041870411216e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7746643116011517e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6997331667677426e-03, - "cpu_time": 3.0239276611100938e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6996009469729071e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.3701471116612939e+07, - "cpu_time": 2.4987132843137920e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4489656413109889e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.3699745558494447e+07, - "cpu_time": 2.5020869098039284e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4492741019700742e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3684617811996562e+07, - "cpu_time": 2.4995549254901350e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4519816673714223e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.3716228708040481e+07, - "cpu_time": 2.5044647450978994e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4463307454424644e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.3717662579580849e+07, - "cpu_time": 2.5041795411766544e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4460750368613653e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3703945154945057e+07, - "cpu_time": 2.5017998811764818e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4485254385912628e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time_median", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3701471116612941e+07, - "cpu_time": 2.5020869098039284e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4489656413109889e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3567950070782923e+04, - "cpu_time": 2.6178986372150488e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4249195515233078e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.9007620925036606e-04, - "cpu_time": 1.0464060922346719e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9035914158950434e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 28, - "real_time": 2.5350436036075864e+07, - "cpu_time": 4.8319202357142948e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6472469311572504e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 28, - "real_time": 2.5264881684311800e+07, - "cpu_time": 4.8173652428573631e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6562112911722512e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 28, - "real_time": 2.5374185027820725e+07, - "cpu_time": 4.8302967642858408e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6447692379645143e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 28, - "real_time": 2.5355042157960791e+07, - "cpu_time": 4.8309076214288943e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6467660192365193e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 28, - "real_time": 2.5423150908734117e+07, - "cpu_time": 4.8412885357143819e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6396753195900970e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5353539162980661e+07, - "cpu_time": 4.8303556800001547e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6469337598241267e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time_median", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5355042157960787e+07, - "cpu_time": 4.8309076214288943e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6467660192365193e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.7323825317560229e+04, - "cpu_time": 8.5298701079510356e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9910122392263561e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2609792245991511e-03, - "cpu_time": 1.7658886162914534e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2633782265954489e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 4.6027964353561401e+07, - "cpu_time": 8.8208412399997845e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9160039963751936e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 4.6088519444068275e+07, - "cpu_time": 8.8198676066667765e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9121726976472492e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 4.5907409240802132e+07, - "cpu_time": 8.8051736933334723e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9236615661749954e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.6056466052929558e+07, - "cpu_time": 8.8236075599994972e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9141994491230116e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 4.6003494411706924e+07, - "cpu_time": 8.8206152799997047e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9175550622051096e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6016770700613663e+07, - "cpu_time": 8.8180210759998471e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9167185543051119e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time_median", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6027964353561401e+07, - "cpu_time": 8.8206152799997047e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9160039963751936e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8893195941097656e+04, - "cpu_time": 7.3204668508098912e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3711113004177781e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4971323474504247e-03, - "cpu_time": 8.3017116739878590e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4986400706938161e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.7608260102570057e+07, - "cpu_time": 1.6618887462499288e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0640427704616089e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.7536820210516453e+07, - "cpu_time": 1.6724233762499806e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0665433740275483e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.7073818780481815e+07, - "cpu_time": 1.6667505437500551e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0828492394107747e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.7470420636236668e+07, - "cpu_time": 1.6732946237499392e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0688712143770614e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.7760580703616142e+07, - "cpu_time": 1.6641018112500206e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0587247013161483e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7489980086684242e+07, - "cpu_time": 1.6676918202499849e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0682062599186287e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time_median", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7536820210516453e+07, - "cpu_time": 1.6667505437500551e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0665433740275483e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5640868653225206e+05, - "cpu_time": 5.0306277729078318e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0119198885742426e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9307205954122372e-03, - "cpu_time": 3.0165212252187858e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9371949357841561e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.6948897019028664e+08, - "cpu_time": 3.1385612849999231e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1675861349399357e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.7040410265326500e+08, - "cpu_time": 3.1723117149999779e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1505750368722906e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.6989193111658096e+08, - "cpu_time": 3.1440853000000858e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1600730445026002e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.7001368850469589e+08, - "cpu_time": 3.1675782350001216e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1578099194358182e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.6925028711557388e+08, - "cpu_time": 3.1392239774999100e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1720531831854057e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6980979591608047e+08, - "cpu_time": 3.1523521025000042e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1616194637872105e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time_median", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6989193111658096e+08, - "cpu_time": 3.1440853000000858e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1600730445026002e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5207801342768100e+05, - "cpu_time": 1.6287231033634427e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4164581589359790e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6622610962390926e-03, - "cpu_time": 5.1666915699923495e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6620718449316960e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.2959860563278198e+08, - "cpu_time": 5.7431398950001264e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2577256264132853e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.3097773790359497e+08, - "cpu_time": 5.7686793249996531e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2441511951862831e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.3033533394336700e+08, - "cpu_time": 5.7570293600002742e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2504601042287631e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.3052547276020050e+08, - "cpu_time": 5.7583159249998057e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2485902373370490e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.2914710044860840e+08, - "cpu_time": 5.7385456750000679e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2621943882736692e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3011685013771057e+08, - "cpu_time": 5.7531420359999871e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2526243102878098e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time_median", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3033533394336700e+08, - "cpu_time": 5.7570293600002742e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2504601042287631e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3566758675121644e+05, - "cpu_time": 1.2210490814409521e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2519140721660517e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2285066225620643e-03, - "cpu_time": 2.1224038513221145e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2295578524789304e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 311, - "real_time": 2.2468174818208460e+06, - "cpu_time": 2.5783496591639696e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8230230239621226e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 311, - "real_time": 2.2536928696599803e+06, - "cpu_time": 2.5817045980706965e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8174614896030498e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 311, - "real_time": 2.2459958367037717e+06, - "cpu_time": 2.5737932604502123e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8236899343550426e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 311, - "real_time": 2.2578909506548159e+06, - "cpu_time": 2.5850196591641605e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8140822960524776e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 311, - "real_time": 2.2471791561513278e+06, - "cpu_time": 2.5753816816721219e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8227296158331626e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2503152589981481e+06, - "cpu_time": 2.5788497717042323e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8201972719611712e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time_median", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2471791561513273e+06, - "cpu_time": 2.5783496591639691e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8227296158331626e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2327419453349448e+03, - "cpu_time": 4.5843105243657719e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2271079336283747e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3253372719272175e-03, - "cpu_time": 1.7776570681495077e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3223350560644881e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 312, - "real_time": 2.2521156956477519e+06, - "cpu_time": 2.5827414807691020e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6374685438368754e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 312, - "real_time": 2.2461612981994851e+06, - "cpu_time": 2.5759776025638124e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6471111876812577e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 312, - "real_time": 2.2460377173653492e+06, - "cpu_time": 2.5825408461537189e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6473118579724445e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 312, - "real_time": 2.2559669689657404e+06, - "cpu_time": 2.5863369134614142e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6312588405297725e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 312, - "real_time": 2.2523095099947965e+06, - "cpu_time": 2.5825609134616256e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6371555346400533e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2505182380346246e+06, - "cpu_time": 2.5820315512819346e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6400611929320814e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time_median", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2521156956477519e+06, - "cpu_time": 2.5825609134616251e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6374685438368754e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3158772287598840e+03, - "cpu_time": 3.7493347422366146e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9806994049399455e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9177259512142128e-03, - "cpu_time": 1.4520871134882660e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9177423221605153e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 308, - "real_time": 2.2517752383122002e+06, - "cpu_time": 2.5833112532465491e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2760370223630723e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 308, - "real_time": 2.2528624984544595e+06, - "cpu_time": 2.5927659740262525e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2725255142024802e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 308, - "real_time": 2.2577846221710471e+06, - "cpu_time": 2.5900280129868793e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2566709149809983e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 308, - "real_time": 2.2510604263138170e+06, - "cpu_time": 2.5900348441558150e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2783474883565521e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 308, - "real_time": 2.2518406712825033e+06, - "cpu_time": 2.5917676720779017e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2758255985618774e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2530646913068052e+06, - "cpu_time": 2.5895815512986793e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2718813076929962e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time_median", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2518406712825033e+06, - "cpu_time": 2.5900348441558145e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2758255985618774e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7155396111722534e+03, - "cpu_time": 3.6959813407433940e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7522844975344160e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2052648206906155e-03, - "cpu_time": 1.4272504138322477e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2035791189654438e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 308, - "real_time": 2.2776044199134330e+06, - "cpu_time": 2.6152851525975396e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4387046193581518e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 308, - "real_time": 2.2736974121010923e+06, - "cpu_time": 2.6102423798701470e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4411768173549332e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 308, - "real_time": 2.2681851813859949e+06, - "cpu_time": 2.6121371883117594e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4446792205906583e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 308, - "real_time": 2.2691809957810715e+06, - "cpu_time": 2.6139431136363321e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4440452331005432e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 308, - "real_time": 2.2678999714069553e+06, - "cpu_time": 2.6114069253249858e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4448609027351173e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2713135961177098e+06, - "cpu_time": 2.6126029519481529e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4426933586278809e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time_median", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2691809957810710e+06, - "cpu_time": 2.6121371883117589e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4440452331005432e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2203329033637037e+03, - "cpu_time": 2.0130790875549978e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6776574731207453e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8581022499831804e-03, - "cpu_time": 7.7052622406856546e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8560128922111459e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 304, - "real_time": 2.3062570598037718e+06, - "cpu_time": 2.6584272861842499e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8416606779114269e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 304, - "real_time": 2.3150029285859903e+06, - "cpu_time": 2.6612464243422542e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8309251444459099e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 304, - "real_time": 2.3062739407913270e+06, - "cpu_time": 2.6584261019735322e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8416398781106349e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 304, - "real_time": 2.3127586985202995e+06, - "cpu_time": 2.6658441644737027e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8336721873289183e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 304, - "real_time": 2.3152245067697214e+06, - "cpu_time": 2.6622287401314797e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8306542112167779e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3111034268942219e+06, - "cpu_time": 2.6612345434210440e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8357104198027339e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time_median", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3127586985202995e+06, - "cpu_time": 2.6612464243422546e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8336721873289183e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5205239445158286e+03, - "cpu_time": 3.0824183306129357e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5493815984305853e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9560024410464130e-03, - "cpu_time": 1.1582663159972573e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9569634331056372e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 296, - "real_time": 2.3643899971707347e+06, - "cpu_time": 2.7335394459459553e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5435863016187161e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 296, - "real_time": 2.3667127180315955e+06, - "cpu_time": 2.7361905675673834e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5381457580966182e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 296, - "real_time": 2.3718170461408491e+06, - "cpu_time": 2.7403118885137849e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5262272532051086e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 296, - "real_time": 2.3631824289033241e+06, - "cpu_time": 2.7318568682432757e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5464190321026653e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 296, - "real_time": 2.3739181547048124e+06, - "cpu_time": 2.7378721756757367e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5213360974653438e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3680040689902632e+06, - "cpu_time": 2.7359541891892273e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5351428884976901e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time_median", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3667127180315959e+06, - "cpu_time": 2.7361905675673839e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5381457580966182e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6768718212821159e+03, - "cpu_time": 3.3668647943613187e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0926754971742525e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9750269361979485e-03, - "cpu_time": 1.2305998425211407e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9740691779518249e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 281, - "real_time": 2.4957884934952888e+06, - "cpu_time": 2.8946587295375504e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0503454146183436e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 281, - "real_time": 2.4886539287109496e+06, - "cpu_time": 2.8867162064056844e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0533565835559264e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 281, - "real_time": 2.4892364162951708e+06, - "cpu_time": 2.8881605302492916e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0531100954651761e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 281, - "real_time": 2.4970656292334041e+06, - "cpu_time": 2.8949125195727819e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0498082106094980e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 281, - "real_time": 2.4900050963079589e+06, - "cpu_time": 2.8881098505338789e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0527849938487779e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4921499128085552e+06, - "cpu_time": 2.8905115672598379e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0518810596195444e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time_median", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4900050963079589e+06, - "cpu_time": 2.8881605302492916e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0527849938487779e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9596130474345605e+03, - "cpu_time": 3.9454948513441204e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6703072828075677e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5888342138183141e-03, - "cpu_time": 1.3649815126269814e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5879240980075278e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 271, - "real_time": 2.5791789987554080e+06, - "cpu_time": 3.0423100036897161e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0327708943543547e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 271, - "real_time": 2.5873319632494031e+06, - "cpu_time": 3.0524785239851647e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0263654121195650e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 271, - "real_time": 2.5791388350398010e+06, - "cpu_time": 3.0438991771216593e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0328025497390848e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 271, - "real_time": 2.5821133255546163e+06, - "cpu_time": 3.0420400885606888e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0304608431056654e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 271, - "real_time": 2.5818936829197449e+06, - "cpu_time": 3.0453061070108232e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0306335751482484e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5819313611037945e+06, - "cpu_time": 3.0452067800736106e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0306066548933840e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time_median", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5818936829197453e+06, - "cpu_time": 3.0438991771216597e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0306335751482484e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3382156371681522e+03, - "cpu_time": 4.2725051020414821e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6227853827562789e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2929141678425719e-03, - "cpu_time": 1.4030262673782054e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2916265079875781e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 253, - "real_time": 2.7441728230668856e+06, - "cpu_time": 3.3478148221343593e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8211004466843754e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 253, - "real_time": 2.7471647759818514e+06, - "cpu_time": 3.3471983715414423e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8169388642704672e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 253, - "real_time": 2.7424008005736726e+06, - "cpu_time": 3.3453471462449464e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8235694789056808e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 253, - "real_time": 2.7486022530499063e+06, - "cpu_time": 3.3501820237157522e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8149426634445858e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 253, - "real_time": 2.7406724333660053e+06, - "cpu_time": 3.3416291778659346e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8259807601748776e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7446026172076645e+06, - "cpu_time": 3.3464343083004872e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8205064426959974e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time_median", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7441728230668856e+06, - "cpu_time": 3.3471983715414419e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8211004466843754e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2802747207239854e+03, - "cpu_time": 3.1939858226618535e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5658087673488911e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1951729187161197e-03, - "cpu_time": 9.5444450074501667e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1950794576142528e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 228, - "real_time": 3.0845000159420203e+06, - "cpu_time": 4.0103446184213697e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7990014237672818e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 228, - "real_time": 3.0860544045521109e+06, - "cpu_time": 4.0102803333333642e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7955768923145938e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 228, - "real_time": 3.0911252833902836e+06, - "cpu_time": 4.0108315964913713e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7844289950612617e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 228, - "real_time": 3.0730220289051272e+06, - "cpu_time": 3.9926656491228156e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8243962466718292e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 228, - "real_time": 3.0682325687896656e+06, - "cpu_time": 4.0075169956139685e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8350490159462368e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0805868603158416e+06, - "cpu_time": 4.0063278385965778e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8076905147522414e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time_median", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0845000159420203e+06, - "cpu_time": 4.0102803333333642e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7990014237672818e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5671362121577422e+03, - "cpu_time": 7.7477429875940488e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1159557625243491e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1056213137184057e-03, - "cpu_time": 1.9338764324159984e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1081844245696546e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 194, - "real_time": 3.6119517567807557e+06, - "cpu_time": 5.0884923659798019e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1612292418153117e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 194, - "real_time": 3.5995690058436743e+06, - "cpu_time": 5.0721921907214765e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1652239457531750e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 194, - "real_time": 3.6053685915473965e+06, - "cpu_time": 5.0809525515461182e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1633495698146739e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 194, - "real_time": 3.6062676178713897e+06, - "cpu_time": 5.0780899639179194e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1630595519906814e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 194, - "real_time": 3.6028655241099522e+06, - "cpu_time": 5.0772609742267309e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1641577993772488e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6052044992306330e+06, - "cpu_time": 5.0793976092784097e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1634040217502182e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time_median", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6053685915473960e+06, - "cpu_time": 5.0780899639179194e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1633495698146739e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5801807364977267e+03, - "cpu_time": 5.9859344970288694e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4774637289625760e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2704357651487337e-03, - "cpu_time": 1.1784733067745103e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2699489612730478e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 144, - "real_time": 4.8245871019187486e+06, - "cpu_time": 7.4981646249996619e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7387203967493577e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 144, - "real_time": 4.8595072423470104e+06, - "cpu_time": 7.5402460902777892e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7262260516662035e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 144, - "real_time": 4.8569638456683606e+06, - "cpu_time": 7.5427840486115534e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7271300068418884e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 144, - "real_time": 4.8488482845843667e+06, - "cpu_time": 7.5304820555557059e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7300207199036038e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 144, - "real_time": 4.9282586680621738e+06, - "cpu_time": 7.6427743055557720e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7021444215910974e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8636330285161324e+06, - "cpu_time": 7.5508902250000983e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7248483193504305e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time_median", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8569638456683606e+06, - "cpu_time": 7.5402460902777882e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7271300068418884e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8668935966312252e+04, - "cpu_time": 5.4355713210728507e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3617630818599835e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.9506278001631910e-03, - "cpu_time": 7.1985834240793529e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8949729467969500e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 88, - "real_time": 7.7776112911206754e+06, - "cpu_time": 1.3301786727273619e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1571168025784140e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 88, - "real_time": 7.7867858397605065e+06, - "cpu_time": 1.3311554045454375e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1545752439129629e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 88, - "real_time": 7.7298238069157712e+06, - "cpu_time": 1.3214015636363415e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1704525768090143e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 88, - "real_time": 7.7423674414273016e+06, - "cpu_time": 1.3233186034090687e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1669361635085521e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 88, - "real_time": 7.7762148946269667e+06, - "cpu_time": 1.3281824931818224e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1575041620303397e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7625606547702430e+06, - "cpu_time": 1.3268473475000065e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1613169897678566e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time_median", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7762148946269657e+06, - "cpu_time": 1.3281824931818226e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1575041620303397e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4896217488681865e+04, - "cpu_time": 4.2880151007653563e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9401806365425391e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2072171279438123e-03, - "cpu_time": 3.2317320518028434e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2110887340445014e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.3759192517575096e+07, - "cpu_time": 2.5020629019607835e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4386919477389212e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.3744930681936881e+07, - "cpu_time": 2.4962951607841544e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4412223514590793e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3744350194054492e+07, - "cpu_time": 2.5078468745097302e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4413254556417603e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.3733366559095243e+07, - "cpu_time": 2.4978808392155964e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4432779723466854e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.3722018977882816e+07, - "cpu_time": 2.4944041803921353e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4452984691307540e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3740771786108907e+07, - "cpu_time": 2.4996979913724802e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4419632392634401e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time_median", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3744350194054490e+07, - "cpu_time": 2.4978808392155968e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4413254556417603e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3927759770080946e+04, - "cpu_time": 5.3596369080182936e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4753440299400808e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0136082591926223e-03, - "cpu_time": 2.1441137795512408e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0136696532281580e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 28, - "real_time": 2.5196381977626257e+07, - "cpu_time": 4.8092221107144237e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6634325539115481e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 28, - "real_time": 2.3788872241441693e+07, - "cpu_time": 4.5826041142857678e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.8210191436940923e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 28, - "real_time": 2.5255987686770301e+07, - "cpu_time": 4.8077757178569011e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6571466866509933e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 28, - "real_time": 2.5190713349729776e+07, - "cpu_time": 4.8028395964284495e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6640319020866427e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 28, - "real_time": 2.5335073604115419e+07, - "cpu_time": 4.8164940821428515e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6488521426319780e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4953405771936692e+07, - "cpu_time": 4.7637871242856786e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6908964857950511e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time_median", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5196381977626257e+07, - "cpu_time": 4.8077757178569004e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6634325539115481e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.5358947665203142e+05, - "cpu_time": 1.0140233781301227e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2997697301553831e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6192395644328306e-02, - "cpu_time": 2.1286076637653570e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7127649720790341e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 4.5607308298349380e+07, - "cpu_time": 8.7541307866664886e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9428995704369950e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 4.5631233106056847e+07, - "cpu_time": 8.7606219600002080e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9413565854783936e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 4.5454634974400200e+07, - "cpu_time": 8.7257142000006154e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9527842006781197e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.5531158894300461e+07, - "cpu_time": 8.7375848133334935e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9478214756532636e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 4.4939977178970970e+07, - "cpu_time": 8.6018314733337328e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9865998254846754e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5432862490415573e+07, - "cpu_time": 8.7159766466669068e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9542923315462894e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time_median", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5531158894300461e+07, - "cpu_time": 8.7375848133334935e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9478214756532636e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8410138831553172e+05, - "cpu_time": 6.5268284427685128e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8608124108236168e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.2532134834221639e-03, - "cpu_time": 7.4883500809567330e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2986739360679968e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.6399425752460957e+07, - "cpu_time": 1.6538697225000477e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1069125015840054e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.6130925454199314e+07, - "cpu_time": 1.6509752800000399e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1165978373556700e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.8037856854498386e+07, - "cpu_time": 1.6794608074999928e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0490912158805466e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.6256864480674267e+07, - "cpu_time": 1.6523015299999601e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1120474598301983e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.6397007107734680e+07, - "cpu_time": 1.6535764599998969e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1069994781794744e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6644415929913521e+07, - "cpu_time": 1.6580367599999875e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0983296985659790e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time_median", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6397007107734680e+07, - "cpu_time": 1.6535764599998969e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1069994781794744e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8688905143908877e+05, - "cpu_time": 1.2031268135993171e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7817079431089096e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.0818207150891467e-03, - "cpu_time": 7.2563337715101451e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9780888857515281e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.6779451444745064e+08, - "cpu_time": 3.1324641424998844e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1995736795563455e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6670711338520050e+08, - "cpu_time": 3.1107500950000143e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2204439336639667e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.6807947680354118e+08, - "cpu_time": 3.1349443975000215e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1941491145139556e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.6689658910036087e+08, - "cpu_time": 3.1120036249998862e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2167878019194293e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.6843883320689201e+08, - "cpu_time": 3.1401617624999291e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1873345461884432e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6758330538868904e+08, - "cpu_time": 3.1260648044999468e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2036578151684284e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time_median", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6779451444745064e+08, - "cpu_time": 3.1324641424998844e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1995736795563455e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5199981296288152e+05, - "cpu_time": 1.3700182658780720e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4385018145946149e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.4873193736017416e-03, - "cpu_time": 4.3825651467811564e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4901855865620514e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.1992740929126740e+08, - "cpu_time": 5.6015621250003278e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3562045414572372e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.2043918967247009e+08, - "cpu_time": 5.6084988999998581e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3508442743769941e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.1838670372962952e+08, - "cpu_time": 5.5917155049996841e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3724455557409511e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.2075943052768707e+08, - "cpu_time": 5.6096561650002742e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3474988474495296e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.1979086995124817e+08, - "cpu_time": 5.5975269599997544e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3576375215580449e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1986072063446045e+08, - "cpu_time": 5.6017919309999800e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3569261481165514e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time_median", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1992740929126740e+08, - "cpu_time": 5.6015621250003278e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3562045414572372e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1164113425165694e+05, - "cpu_time": 7.5267316768419836e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5882997371921986e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8501190532034355e-03, - "cpu_time": 1.3436292831923127e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8562736605247758e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 313, - "real_time": 2.2458794865959557e+06, - "cpu_time": 2.5776135015975614e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8237844124967910e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 313, - "real_time": 2.2381191795019391e+06, - "cpu_time": 2.5701109872205071e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8301080824978701e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 313, - "real_time": 2.2365841151664434e+06, - "cpu_time": 2.5802707252395181e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8313641647656886e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 313, - "real_time": 2.2359016640022541e+06, - "cpu_time": 2.5670168466453711e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8319231413192735e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 313, - "real_time": 2.2445089948443938e+06, - "cpu_time": 2.5828695335463085e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8248980108382078e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2401986880221972e+06, - "cpu_time": 2.5755763188498532e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8284155623835661e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time_median", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2381191795019386e+06, - "cpu_time": 2.5776135015975614e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8301080824978701e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6557525004105610e+03, - "cpu_time": 6.7548678697176856e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7974566648721657e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0782765945287569e-03, - "cpu_time": 2.6226626717604441e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0769111480990190e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 313, - "real_time": 2.2382249828047170e+06, - "cpu_time": 2.5718579137379234e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6600431426400286e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 313, - "real_time": 2.2477263691849983e+06, - "cpu_time": 2.5877156198081407e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6445717380493837e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 313, - "real_time": 2.2435295626152153e+06, - "cpu_time": 2.5770642651756695e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6513893716875436e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 313, - "real_time": 2.2483755701992172e+06, - "cpu_time": 2.5883476070286212e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6435193962164195e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 313, - "real_time": 2.2400428009882998e+06, - "cpu_time": 2.5738107124601165e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6570729793134825e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2435798571584900e+06, - "cpu_time": 2.5797592236420945e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6513193255813713e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time_median", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2435295626152148e+06, - "cpu_time": 2.5770642651756690e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6513893716875436e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5105543115600713e+03, - "cpu_time": 7.7804700012811909e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3413768705515149e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0104273521481522e-03, - "cpu_time": 3.0159675096719891e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0106093759363554e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 311, - "real_time": 2.2576322593393815e+06, - "cpu_time": 2.5997554180065570e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2571606523704678e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 311, - "real_time": 2.2492906089177374e+06, - "cpu_time": 2.5858872411577054e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2840743366119694e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 311, - "real_time": 2.2613014831204698e+06, - "cpu_time": 2.5976807524116589e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2453850679790806e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 311, - "real_time": 2.2501909433058510e+06, - "cpu_time": 2.5868037491961103e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2811598716727439e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 311, - "real_time": 2.2493364009407270e+06, - "cpu_time": 2.5853540482313754e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2839260473212525e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2535503391248332e+06, - "cpu_time": 2.5910962418006817e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2703411951911040e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time_median", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2501909433058510e+06, - "cpu_time": 2.5868037491961103e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2811598716727439e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5662020850032659e+03, - "cpu_time": 7.0155021201159780e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7935482540618854e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4699701570300406e-03, - "cpu_time": 2.7075420846739973e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4669382163910137e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 307, - "real_time": 2.2642139333272991e+06, - "cpu_time": 2.6043652605864150e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4472130710655460e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 307, - "real_time": 2.2637005971216806e+06, - "cpu_time": 2.6050923583061644e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4475412535414295e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 307, - "real_time": 2.2727658817429300e+06, - "cpu_time": 2.6194164788271058e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4417675073013239e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 307, - "real_time": 2.2642483429661696e+06, - "cpu_time": 2.6043021563515607e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4471910778600311e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 307, - "real_time": 2.2782642896369053e+06, - "cpu_time": 2.6194864788274583e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4382879172118504e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2686386089589973e+06, - "cpu_time": 2.6105325465797409e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4444001653960362e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time_median", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2642483429661696e+06, - "cpu_time": 2.6050923583061644e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4471910778600311e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.5750334596940493e+03, - "cpu_time": 8.1477908392230065e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1790708277322992e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8982286705907349e-03, - "cpu_time": 3.1211221058699509e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8932915737976610e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 305, - "real_time": 2.2946536853970564e+06, - "cpu_time": 2.6449332721313112e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8560301023664035e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 305, - "real_time": 2.3000978841828029e+06, - "cpu_time": 2.6565414327870100e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8492700441435408e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 305, - "real_time": 2.2939066463684449e+06, - "cpu_time": 2.6435976688524117e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8569602038405567e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 305, - "real_time": 2.3082809751761742e+06, - "cpu_time": 2.6577621967209750e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8391690918389224e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 305, - "real_time": 2.2937996458017924e+06, - "cpu_time": 2.6430737606553938e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8570934745738022e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2981477673852546e+06, - "cpu_time": 2.6491816662294203e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8517045833526451e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time_median", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2946536853970564e+06, - "cpu_time": 2.6449332721313112e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8560301023664035e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.2367205600611751e+03, - "cpu_time": 7.3199736496051919e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7207081717571418e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7138031107360339e-03, - "cpu_time": 2.7631074693430552e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7074011161002474e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 295, - "real_time": 2.3773980595297734e+06, - "cpu_time": 2.7572610440675830e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5132542686572559e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 295, - "real_time": 2.3798409154859642e+06, - "cpu_time": 2.7539143627117001e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5075950307054482e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 295, - "real_time": 2.3732939222038295e+06, - "cpu_time": 2.7413707559324363e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5227883396038510e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 295, - "real_time": 2.3796408129382436e+06, - "cpu_time": 2.7526244474571841e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5080581610196806e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 295, - "real_time": 2.3748076907595838e+06, - "cpu_time": 2.7433743491525031e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5192679605175324e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3769962801834792e+06, - "cpu_time": 2.7497089918642817e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5141927521007538e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time_median", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3773980595297730e+06, - "cpu_time": 2.7526244474571841e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5132542686572559e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9044925723108067e+03, - "cpu_time": 6.9439253037432090e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7395428535621017e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2219171719051283e-03, - "cpu_time": 2.5253309802195762e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2222174952071676e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 279, - "real_time": 2.4805168953380384e+06, - "cpu_time": 2.8798350179216526e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0568119914550136e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 279, - "real_time": 2.4849608228425076e+06, - "cpu_time": 2.8880967885304200e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0549220639226721e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 279, - "real_time": 2.4933754241154077e+06, - "cpu_time": 2.8927200860217265e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0513619307569884e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 279, - "real_time": 2.4806573831786714e+06, - "cpu_time": 2.8801914838708900e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0567521406930175e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 279, - "real_time": 2.4806103547267267e+06, - "cpu_time": 2.8883459318995685e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0567721750435035e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4840241760402704e+06, - "cpu_time": 2.8858378616488511e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0553240603742391e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time_median", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4806573831786709e+06, - "cpu_time": 2.8880967885304200e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0567521406930175e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5590834642417412e+03, - "cpu_time": 5.6274748817451855e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3563987695740294e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2379345248979650e-03, - "cpu_time": 1.9500315511592440e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2328674746015013e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 272, - "real_time": 2.5829145212329049e+06, - "cpu_time": 3.0515097941173841e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0298310133381462e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 272, - "real_time": 2.5911451521096751e+06, - "cpu_time": 3.0577106213234412e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0233833661272579e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 272, - "real_time": 2.5863456984927109e+06, - "cpu_time": 3.0610981176467328e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0271381366595668e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 272, - "real_time": 2.5834986325421864e+06, - "cpu_time": 3.0496045036760978e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0293720824775347e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 272, - "real_time": 2.5816009926048163e+06, - "cpu_time": 3.0526258308829227e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0308637992542654e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5851009993964592e+06, - "cpu_time": 3.0545097735293163e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0281176795713544e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time_median", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5834986325421864e+06, - "cpu_time": 3.0526258308829227e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0293720824775347e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7973468269648811e+03, - "cpu_time": 4.7503287650011171e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9758797295925790e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4689355765408951e-03, - "cpu_time": 1.5551853217717409e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4673111721118350e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 255, - "real_time": 2.7362484950572252e+06, - "cpu_time": 3.3396845647057844e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8321665663559198e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 255, - "real_time": 2.7407741959334589e+06, - "cpu_time": 3.3468237294117920e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8258387048294348e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 255, - "real_time": 2.7434439663136122e+06, - "cpu_time": 3.3524697294122982e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8221156067895931e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 255, - "real_time": 2.7410979537914195e+06, - "cpu_time": 3.3453939019610141e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8253868255588436e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 255, - "real_time": 2.7348517732439088e+06, - "cpu_time": 3.3397104274511137e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8341237000798959e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7392832768679252e+06, - "cpu_time": 3.3448164705884005e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8279262807227379e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time_median", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7407741959334584e+06, - "cpu_time": 3.3453939019610141e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8258387048294348e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5942785667813696e+03, - "cpu_time": 5.3698933905245412e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0239119745473249e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3121237212425283e-03, - "cpu_time": 1.6054373798212913e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3124369713825254e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 227, - "real_time": 3.0761526493429481e+06, - "cpu_time": 3.9996462687227372e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8174510144935167e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 227, - "real_time": 3.0737828805894973e+06, - "cpu_time": 4.0028718325988185e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8227070078476179e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 227, - "real_time": 3.0745032893715319e+06, - "cpu_time": 3.9988887136569405e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8211083307335961e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 227, - "real_time": 3.0716140446815197e+06, - "cpu_time": 4.0103021585904737e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8275244529214382e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 227, - "real_time": 3.0712722728874059e+06, - "cpu_time": 4.0062323612336502e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8282842212110269e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0734650273745810e+06, - "cpu_time": 4.0035882669605250e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8234150054414403e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time_median", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0737828805894973e+06, - "cpu_time": 4.0028718325988189e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8227070078476179e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0394018514422128e+03, - "cpu_time": 4.7488420927429233e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5273617474197928e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.6355134458266900e-04, - "cpu_time": 1.1861464706379974e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6350379447965228e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 195, - "real_time": 3.5907861836350118e+06, - "cpu_time": 5.0657942666662280e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1680740053850930e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 195, - "real_time": 3.5876189800313651e+06, - "cpu_time": 5.0623515846149158e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1691051985579948e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 195, - "real_time": 3.5897137847943949e+06, - "cpu_time": 5.0677218820510460e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1684229583334968e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 195, - "real_time": 3.5874778464532052e+06, - "cpu_time": 5.0638422000002516e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1691511918733490e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 195, - "real_time": 3.5904177607825170e+06, - "cpu_time": 5.0697544769228939e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1681938647400932e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5892029111392992e+06, - "cpu_time": 5.0658928820510665e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1685894437780054e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time_median", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5897137847943949e+06, - "cpu_time": 5.0657942666662280e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1684229583334968e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5595102817094566e+03, - "cpu_time": 2.9585877275533021e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0779937739229260e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.3450045046754704e-04, - "cpu_time": 5.8402098039535256e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3454044540278960e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 143, - "real_time": 4.8442488484136704e+06, - "cpu_time": 7.5392525034966785e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7316633109686320e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 143, - "real_time": 4.8855671339987461e+06, - "cpu_time": 7.5901802587414738e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7170182641895416e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 143, - "real_time": 4.8963073022350986e+06, - "cpu_time": 7.6652550209794892e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7132519431880252e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 143, - "real_time": 4.8896074229916492e+06, - "cpu_time": 7.6699437062928090e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7155994897577131e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 143, - "real_time": 4.9939514593696678e+06, - "cpu_time": 7.7959306643358357e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6797536115937345e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9019364334017672e+06, - "cpu_time": 7.6521124307692572e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7114573239395294e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time_median", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8896074229916492e+06, - "cpu_time": 7.6652550209794892e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7155994897577131e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5331428781341725e+04, - "cpu_time": 9.7143352174072978e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9135761943937324e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1287667543853420e-02, - "cpu_time": 1.2694971885600913e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1180975228695473e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 88, - "real_time": 7.7484439878555182e+06, - "cpu_time": 1.3247744409090437e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1652367915797906e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 88, - "real_time": 7.7285656218670988e+06, - "cpu_time": 1.3185825704544580e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1708059193455992e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 88, - "real_time": 7.7660312209363012e+06, - "cpu_time": 1.3272446295453412e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1603333186158986e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 88, - "real_time": 7.7451456401666459e+06, - "cpu_time": 1.3212195749999141e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1661588793105016e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 88, - "real_time": 7.8064641724763950e+06, - "cpu_time": 1.3315818840908378e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1491440464368224e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7589301286603929e+06, - "cpu_time": 1.3246806199999193e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1623357910577226e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time_median", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7484439878555182e+06, - "cpu_time": 1.3247744409090441e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1652367915797906e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9714833744170348e+04, - "cpu_time": 5.0836855261200166e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2584336143460041e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8297591615637765e-03, - "cpu_time": 3.8376688307860400e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8192188505127272e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.3812724026102645e+07, - "cpu_time": 2.5045230509802282e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4292407447358241e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.3750559029479822e+07, - "cpu_time": 2.5008776784310542e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4402231158793368e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3781956762221513e+07, - "cpu_time": 2.5005719313724633e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4346638564400315e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.3771337073515443e+07, - "cpu_time": 2.5010724372551147e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4365413337046785e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.3766182677856848e+07, - "cpu_time": 2.4969645901957810e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4374536344031601e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3776551913835254e+07, - "cpu_time": 2.5008019376469288e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4356245370326066e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time_median", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3771337073515445e+07, - "cpu_time": 2.5008776784310538e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4365413337046785e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3173151184965762e+04, - "cpu_time": 2.6787930811664653e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0929436845771531e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6820719240852910e-03, - "cpu_time": 1.0711736266835325e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6804493559437151e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 27, - "real_time": 2.5213825826843578e+07, - "cpu_time": 4.8050849259256952e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6615898936112027e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 27, - "real_time": 2.5363983862377979e+07, - "cpu_time": 4.8278263777782977e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6458329402874908e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 27, - "real_time": 2.5424457948516916e+07, - "cpu_time": 4.8276012518516399e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6395396171627979e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 27, - "real_time": 2.5482265899578732e+07, - "cpu_time": 4.8221731407407045e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6335516733270345e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 27, - "real_time": 2.5295734750451867e+07, - "cpu_time": 4.8103522148149185e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6529715251224799e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5356053657553814e+07, - "cpu_time": 4.8186075822222516e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6466971299022012e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time_median", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5363983862377975e+07, - "cpu_time": 4.8221731407407045e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6458329402874908e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0552095951729236e+05, - "cpu_time": 1.0363382855040664e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1022049346026355e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1615687102735189e-03, - "cpu_time": 2.1507007321524339e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1644543387681209e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 4.4757394740978874e+07, - "cpu_time": 8.5700364666672617e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9987833022173924e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 4.5578968028227486e+07, - "cpu_time": 8.7345249999998495e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9447294181140232e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 4.5673784613609314e+07, - "cpu_time": 8.7501911199994236e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9386163011332207e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.5763427764177322e+07, - "cpu_time": 8.7588054266673982e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9328600272609582e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 4.5623139540354408e+07, - "cpu_time": 8.7477921599990323e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9418783834742947e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5479342937469482e+07, - "cpu_time": 8.7122700346665934e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9513734864399776e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time_median", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5623139540354408e+07, - "cpu_time": 8.7477921599990323e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9418783834742947e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0936645389917301e+05, - "cpu_time": 7.9986005271952541e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6867662738106567e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.0011514559922221e-03, - "cpu_time": 9.1808455148524922e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1034438242226772e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.4320518188178539e+07, - "cpu_time": 1.6113371225000605e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1835128835538130e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.6838069371879101e+07, - "cpu_time": 1.6566473225000778e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0912186088619776e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.6680750362575054e+07, - "cpu_time": 1.6560391312501112e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0968289369573646e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.6594729684293270e+07, - "cpu_time": 1.6546728924998888e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0999052364810300e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.4700882434844971e+07, - "cpu_time": 1.6163719462500125e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1692167576470103e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5826990008354202e+07, - "cpu_time": 1.6390136830000299e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1281364847002392e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time_median", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6594729684293270e+07, - "cpu_time": 1.6546728924998888e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0999052364810300e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2122487413776561e+06, - "cpu_time": 2.3047029181986796e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4424739316794194e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4124330135073578e-02, - "cpu_time": 1.4061523354583471e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4201662726059504e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.6388786211609840e+08, - "cpu_time": 3.0517799400001878e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2758430372328601e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6888999566435814e+08, - "cpu_time": 3.1417888124997264e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1788200946309757e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.6417653858661652e+08, - "cpu_time": 3.0561016699999756e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2700830253937702e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.6844015941023827e+08, - "cpu_time": 3.1355923625000060e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1873094509038291e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.6424389928579330e+08, - "cpu_time": 3.0594635075004816e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2687418792086487e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6592769101262096e+08, - "cpu_time": 3.0889452585000753e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2361594974740171e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time_median", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6424389928579330e+08, - "cpu_time": 3.0594635075004816e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2687418792086487e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5075056143622203e+06, - "cpu_time": 4.5545387685415689e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8634696570714206e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5112038256299799e-02, - "cpu_time": 1.4744640605101413e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5028522731551395e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.1834575533866882e+08, - "cpu_time": 5.5738726699996734e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3728793489258585e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.2015129923820496e+08, - "cpu_time": 5.5822642150008047e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3538574622528534e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.2027262449264526e+08, - "cpu_time": 5.5875770850002480e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3525869583794460e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.2102154195308685e+08, - "cpu_time": 5.5925909000006866e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3447656424157152e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.1909766793251038e+08, - "cpu_time": 5.5813515050010669e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3649315927532821e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1977777779102331e+08, - "cpu_time": 5.5835312750004959e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3578042009454312e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time_median", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2015129923820496e+08, - "cpu_time": 5.5822642150008047e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3538574622528534e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0541084555317182e+06, - "cpu_time": 7.0372379620580818e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1077682242375433e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_coarse/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2963780748410370e-03, - "cpu_time": 1.2603561465781270e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2990852293461230e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - } - ] -} diff --git a/results/implicit_managed_GPUWrGPU_fine.json b/results/implicit_managed_GPUWrGPU_fine.json deleted file mode 100644 index d74c20c..0000000 --- a/results/implicit_managed_GPUWrGPU_fine.json +++ /dev/null @@ -1,25272 +0,0 @@ -{ - "context": { - "date": "2023-10-09T13:47:31-04:00", - "host_name": "frontier10485", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1813, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [0.15,0.21,1.04], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52206, - "real_time": 1.3408338988027817e+04, - "cpu_time": 2.5159836264030950e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0548153680014211e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52206, - "real_time": 1.3404672994724717e+04, - "cpu_time": 2.5087740259740262e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0556508178990585e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52206, - "real_time": 1.3408583843248551e+04, - "cpu_time": 2.4928269490096907e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0547595837739462e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52206, - "real_time": 1.3408001745559683e+04, - "cpu_time": 2.5053653794582995e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0548922037219077e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52206, - "real_time": 1.3407269399245037e+04, - "cpu_time": 2.4987907309504655e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0550590713353199e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3407373394161161e+04, - "cpu_time": 2.5043481423591151e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0550354089463305e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3408001745559683e+04, - "cpu_time": 2.5053653794582991e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0548922037219077e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5886595067256217e+00, - "cpu_time": 8.9391054332386432e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6204052811805479e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1849147927941461e-04, - "cpu_time": 3.5694340104079690e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1850616430102887e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52218, - "real_time": 1.3405557952979376e+04, - "cpu_time": 2.5413845934352154e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1108982026214981e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52218, - "real_time": 1.3407016245593852e+04, - "cpu_time": 2.5308449002259760e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1102335150017142e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52218, - "real_time": 1.3408385882887938e+04, - "cpu_time": 2.5178908173426782e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1096093680111051e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52218, - "real_time": 1.3407479283266401e+04, - "cpu_time": 2.5416279194913619e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1100224933588123e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52218, - "real_time": 1.3409235612929881e+04, - "cpu_time": 2.5293321057872738e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1092222080883181e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3407534995531492e+04, - "cpu_time": 2.5322160672565013e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1099971574162900e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3407479283266401e+04, - "cpu_time": 2.5308449002259757e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1100224933588123e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3961564489515894e+00, - "cpu_time": 9.8495552266213423e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3626180774897999e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0413222485840277e-04, - "cpu_time": 3.8896977844756846e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0413455053357725e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52221, - "real_time": 1.3405009352805546e+04, - "cpu_time": 2.5382720763677386e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2222296582412291e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52221, - "real_time": 1.3405226962366291e+04, - "cpu_time": 2.5264343674000862e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2222098175582025e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52221, - "real_time": 1.3406903606870925e+04, - "cpu_time": 2.5377300511288562e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2220569700824387e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52221, - "real_time": 1.3406928539279836e+04, - "cpu_time": 2.5345417858715809e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2220546974646647e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52221, - "real_time": 1.3405102261884040e+04, - "cpu_time": 2.5678928553646991e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2222211871211259e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3405834144641329e+04, - "cpu_time": 2.5409742272265925e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2221544660935323e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3405226962366291e+04, - "cpu_time": 2.5377300511288558e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2222098175582025e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.9071355511580017e-01, - "cpu_time": 1.5773574929326159e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0316928202856856e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.3901671796515182e-05, - "cpu_time": 6.2076878861312221e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3899765298525566e-05, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52209, - "real_time": 1.3406289995379097e+04, - "cpu_time": 2.5714667796740036e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4442258082806306e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52209, - "real_time": 1.3404543206047569e+04, - "cpu_time": 2.5647026432224338e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4445443232423205e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52209, - "real_time": 1.3408732258075201e+04, - "cpu_time": 2.5388598996341610e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4437806176841202e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52209, - "real_time": 1.3408717296278519e+04, - "cpu_time": 2.5380087168878934e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4437833445183082e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52209, - "real_time": 1.3408263388845788e+04, - "cpu_time": 2.5593256622421399e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4438660734588046e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3407309228925234e+04, - "cpu_time": 2.5544727403321263e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4440400334368372e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3408263388845788e+04, - "cpu_time": 2.5593256622421402e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.4438660734588046e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8444380074500117e+00, - "cpu_time": 1.5262896186451238e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3625448077311920e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3756958804759861e-04, - "cpu_time": 5.9749692942375225e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3758141281355128e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52207, - "real_time": 1.3402611610709755e+04, - "cpu_time": 2.5674312640067350e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.8897932659356861e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52207, - "real_time": 1.3400741786027780e+04, - "cpu_time": 2.5661970099795046e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.8904755457888756e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52207, - "real_time": 1.3407377467054546e+04, - "cpu_time": 2.5669232535866846e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.8880551145098429e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52207, - "real_time": 1.3405277729369524e+04, - "cpu_time": 2.5678605761679519e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.8888207557548513e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52207, - "real_time": 1.3403222329999804e+04, - "cpu_time": 2.5571942478977940e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.8895704619712124e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3403846184632284e+04, - "cpu_time": 2.5651212703277342e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.8893430287920942e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3403222329999804e+04, - "cpu_time": 2.5669232535866850e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.8895704619712124e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5529362344929374e+00, - "cpu_time": 4.4744248610293369e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3119901030875242e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9046296110290477e-04, - "cpu_time": 1.7443326804029266e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9045483305735739e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52204, - "real_time": 1.3408478706342143e+04, - "cpu_time": 2.5930801107194915e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.7753073164074612e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52204, - "real_time": 1.3408295211413155e+04, - "cpu_time": 2.5851511455060907e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.7754410932443810e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52204, - "real_time": 1.3412206329176388e+04, - "cpu_time": 2.5728618975557463e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.7725904883278675e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52204, - "real_time": 1.3410492514880249e+04, - "cpu_time": 2.5689126254693085e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.7738393913991489e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52204, - "real_time": 1.3415154860075221e+04, - "cpu_time": 2.6067566450846669e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.7704425604569626e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3410925524377430e+04, - "cpu_time": 2.5853524848670608e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.7735241699671631e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3410492514880247e+04, - "cpu_time": 2.5851511455060903e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 9.7738393913991489e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8557268587903417e+00, - "cpu_time": 1.5363744350521651e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0809642810966265e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1294032642261743e-04, - "cpu_time": 5.9426110909250561e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1291851791712692e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51044, - "real_time": 1.3704197886878168e+04, - "cpu_time": 2.6083063063239559e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9128737206210667e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51044, - "real_time": 1.3713428547952646e+04, - "cpu_time": 2.6266201179374737e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9115861440728981e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51044, - "real_time": 1.3708457037969345e+04, - "cpu_time": 2.6044753565551313e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9122794000369263e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51044, - "real_time": 1.3705736959830143e+04, - "cpu_time": 2.6051696124911807e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9126589162502708e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51044, - "real_time": 1.3715212067294457e+04, - "cpu_time": 2.6383687308988356e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9113375623634239e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3709406499984951e+04, - "cpu_time": 2.6165880248413156e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9121471486689175e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3708457037969343e+04, - "cpu_time": 2.6083063063239555e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.9122794000369263e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7795955709879170e+00, - "cpu_time": 1.5171731801794743e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6660697182552777e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.4863621346359249e-04, - "cpu_time": 5.7982883273016740e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4861698394371258e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 50884, - "real_time": 1.3754496170446722e+04, - "cpu_time": 2.6210808073264729e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8117572138083778e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 50884, - "real_time": 1.3755370174872123e+04, - "cpu_time": 2.6384441828472620e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8115150180236717e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 50884, - "real_time": 1.3748201001505608e+04, - "cpu_time": 2.6121692221523499e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8135025807564468e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 50884, - "real_time": 1.3756923719621023e+04, - "cpu_time": 2.6300052472289924e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8110845904613564e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 50884, - "real_time": 1.3752842324486543e+04, - "cpu_time": 2.6213452578413613e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8122155960918724e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3753566678186407e+04, - "cpu_time": 2.6246089434792877e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8120149998283455e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3754496170446722e+04, - "cpu_time": 2.6213452578413613e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.8117572138083778e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3429574351875275e+00, - "cpu_time": 9.9797294285396703e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2671906475090925e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4306112831732325e-04, - "cpu_time": 3.8023681407219991e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4310477917653504e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 50574, - "real_time": 1.3836427180787448e+04, - "cpu_time": 2.6689854154308534e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.5783725545565598e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 50574, - "real_time": 1.3826445508715773e+04, - "cpu_time": 2.6457411990350727e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.5838435796026489e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 50574, - "real_time": 1.3832257422061126e+04, - "cpu_time": 2.6408645647961515e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.5806570685101746e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 50574, - "real_time": 1.3833560858672439e+04, - "cpu_time": 2.6617300727646540e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.5799427978996033e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 50574, - "real_time": 1.3836473992501689e+04, - "cpu_time": 2.6596206667457769e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.5783469153214035e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3833032992547698e+04, - "cpu_time": 2.6553883837545021e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.5802325831780792e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3833560858672441e+04, - "cpu_time": 2.6596206667457773e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 7.5799427978996033e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1120581821690321e+00, - "cpu_time": 1.1694207961292804e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2538249828257740e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9726367199328819e-04, - "cpu_time": 4.4039538746336419e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9732926504490420e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 50012, - "real_time": 1.3995491688198465e+04, - "cpu_time": 2.6802200051987405e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.4984482479943158e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 50012, - "real_time": 1.3995232376423233e+04, - "cpu_time": 2.6934694153403139e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.4984760121117545e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 50012, - "real_time": 1.3990609531186954e+04, - "cpu_time": 2.6858621010957333e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.4989711458426208e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 50012, - "real_time": 1.3994003922173235e+04, - "cpu_time": 2.6865069763256932e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.4986075548236072e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 50012, - "real_time": 1.3999992542811466e+04, - "cpu_time": 2.7151679336959067e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.4979665121870499e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3995066012158673e+04, - "cpu_time": 2.6922452863312774e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.4984938945918698e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3995232376423233e+04, - "cpu_time": 2.6865069763256935e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.4984760121117545e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3714922210100746e+00, - "cpu_time": 1.3649422110635538e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6097887669222973e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4090577479813106e-04, - "cpu_time": 5.0699028724962882e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4089445942690748e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49840, - "real_time": 1.4046538125929390e+04, - "cpu_time": 2.7166903250401418e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.9860054928818872e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49840, - "real_time": 1.4040301013273185e+04, - "cpu_time": 2.6892173214285605e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.9873319639193341e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49840, - "real_time": 1.4042259584547601e+04, - "cpu_time": 2.6788569703049663e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.9869153000244354e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49840, - "real_time": 1.4044268655168613e+04, - "cpu_time": 2.6986351745585969e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.9864880137111304e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49840, - "real_time": 1.4050105103109217e+04, - "cpu_time": 2.7259339947833203e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.9852474193035193e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4044694496405602e+04, - "cpu_time": 2.7018667572231170e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.9863976379680615e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4044268655168615e+04, - "cpu_time": 2.6986351745585969e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 2.9864880137111304e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8107238520145201e+00, - "cpu_time": 1.9357632429252806e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1022952083713174e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7132835484529636e-04, - "cpu_time": 7.1645399898061200e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7130664401020960e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 39672, - "real_time": 1.7614788743148951e+04, - "cpu_time": 3.1032298674127793e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7622529695467645e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 39672, - "real_time": 1.7652412433313249e+04, - "cpu_time": 3.0684633771929974e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7521028820792804e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 39672, - "real_time": 1.7650936486044742e+04, - "cpu_time": 3.0698289675337750e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7525002464499475e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 39672, - "real_time": 1.7658901590939895e+04, - "cpu_time": 3.0705121420649408e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7503566157840033e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 39672, - "real_time": 1.7622588125417966e+04, - "cpu_time": 3.0988133091349086e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7601452977844269e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7639925475772958e+04, - "cpu_time": 3.0821695326678804e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7554716023288849e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7650936486044739e+04, - "cpu_time": 3.0705121420649404e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 4.7525002464499475e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9809710034839533e+01, - "cpu_time": 1.7295924346923442e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3425342717279816e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1230041794704063e-03, - "cpu_time": 5.6116070720977993e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1234499369340352e-03, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 27695, - "real_time": 2.5282043896814412e+04, - "cpu_time": 3.8617619895287615e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 6.6360204374591577e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 27695, - "real_time": 2.5276965155776379e+04, - "cpu_time": 3.8733737822711584e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 6.6373537711531848e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 27695, - "real_time": 2.5286041008955275e+04, - "cpu_time": 3.8570594367214035e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 6.6349714429626208e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 27695, - "real_time": 2.5278894553600407e+04, - "cpu_time": 3.8829372810977045e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 6.6368471787507288e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 27695, - "real_time": 2.5276976598497193e+04, - "cpu_time": 3.8706265065896034e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 6.6373507664668518e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5280184242728737e+04, - "cpu_time": 3.8691517992417263e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 6.6365087193585095e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time_median", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5278894553600403e+04, - "cpu_time": 3.8706265065896026e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 6.6368471787507288e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8753975240514791e+00, - "cpu_time": 1.0135012720197156e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0172694519239236e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5329783544461900e-04, - "cpu_time": 2.6194404474343472e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5328382662356448e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15893, - "real_time": 4.4065092176841637e+04, - "cpu_time": 5.7949871075316172e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6147422693091516e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15893, - "real_time": 4.4070609908202736e+04, - "cpu_time": 5.7786367205688497e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6137888878534924e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15893, - "real_time": 4.4055338150207484e+04, - "cpu_time": 5.7912316176933127e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6164282034552869e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15893, - "real_time": 4.4068746756258995e+04, - "cpu_time": 5.8000394324545960e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6141107859470337e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15893, - "real_time": 4.4066481923659710e+04, - "cpu_time": 5.7971274082929602e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6145021193498804e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4065253783034117e+04, - "cpu_time": 5.7924044573082669e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6147144531829688e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time_median", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4066481923659703e+04, - "cpu_time": 5.7949871075316172e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6145021193498804e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9317610525138083e+00, - "cpu_time": 8.3395941348702323e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0251688555867389e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3461311448971250e-04, - "cpu_time": 1.4397465156888655e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3462998013776025e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8463, - "real_time": 8.2633367111672516e+04, - "cpu_time": 9.7812601205246581e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 8.1212791328359692e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8463, - "real_time": 8.2607561308678414e+04, - "cpu_time": 9.7638835282996006e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 8.1238161418705164e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8463, - "real_time": 8.2565553114741182e+04, - "cpu_time": 9.7554322580644483e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 8.1279494254388330e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8463, - "real_time": 8.2603988699144771e+04, - "cpu_time": 9.7692754460593176e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 8.1241674956423499e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8463, - "real_time": 8.2591490195337523e+04, - "cpu_time": 9.7447221079993978e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 8.1253969193775903e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2600392085914878e+04, - "cpu_time": 9.7629146921894848e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 8.1245218230330518e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time_median", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2603988699144771e+04, - "cpu_time": 9.7638835282996006e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 8.1241674956423499e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4721869202553549e+01, - "cpu_time": 1.3828498779166316e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4317085215207452e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9929481662556353e-04, - "cpu_time": 1.4164313850073252e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9930481750037790e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4394, - "real_time": 1.5906849982353981e+05, - "cpu_time": 1.7798558056440813e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 8.4377314269570886e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4394, - "real_time": 1.5905557300023371e+05, - "cpu_time": 1.7803682840236847e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 8.4384171813836902e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4394, - "real_time": 1.5901897682445476e+05, - "cpu_time": 1.7820378015475706e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 8.4403591747522363e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4394, - "real_time": 1.5903794276875132e+05, - "cpu_time": 1.7814441966317719e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 8.4393526263829321e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4394, - "real_time": 1.5900635204115152e+05, - "cpu_time": 1.7823362448794034e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 8.4410293222288306e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5903746889162622e+05, - "cpu_time": 1.7812084665453021e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 8.4393779463409558e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time_median", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5903794276875132e+05, - "cpu_time": 1.7814441966317716e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 8.4393526263829321e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5500573315765884e+01, - "cpu_time": 1.0666357594499455e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3531987999451730e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6034317883380602e-04, - "cpu_time": 5.9882702080274290e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6034342916611250e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2215, - "real_time": 3.1619112009422237e+05, - "cpu_time": 3.5281157246049406e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.4896582775635327e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2215, - "real_time": 3.1607511397356557e+05, - "cpu_time": 3.5365262663656881e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.4927741581847583e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2215, - "real_time": 3.1617140041613788e+05, - "cpu_time": 3.5271476297968306e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.4901877793719202e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2215, - "real_time": 3.1619560203155497e+05, - "cpu_time": 3.5287613137697958e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.4895379402908728e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2215, - "real_time": 3.1606767349718791e+05, - "cpu_time": 3.5302911828442552e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.4929740846271106e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1614018200253375e+05, - "cpu_time": 3.5301684234763018e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.4910264480076392e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time_median", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1617140041613788e+05, - "cpu_time": 3.5287613137697952e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.4901877793719202e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3505885135440430e+01, - "cpu_time": 3.7334957108874113e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7057762075420985e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0087887826588093e-04, - "cpu_time": 1.0575970500611087e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0089163754075304e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1104, - "real_time": 6.2937274149431766e+05, - "cpu_time": 7.2017887862317229e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.5302536415115332e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1104, - "real_time": 6.3400969072287239e+05, - "cpu_time": 7.2556128985509346e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.4678660256419946e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1104, - "real_time": 6.2999723229660187e+05, - "cpu_time": 7.2072393297100521e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.5217979457287805e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1104, - "real_time": 6.3411391612675472e+05, - "cpu_time": 7.2503270652175159e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.4664742145902283e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1104, - "real_time": 6.2931578361093521e+05, - "cpu_time": 7.2049987047099881e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.5310256945964685e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3136187285029644e+05, - "cpu_time": 7.2239933568840427e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.5034835044138025e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time_median", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.2999723229660199e+05, - "cpu_time": 7.2072393297100521e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.5217979457287805e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4794177869570603e+03, - "cpu_time": 2.6588516343875026e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3350125817639947e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.9270945769399662e-03, - "cpu_time": 3.6805842738680981e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9219369097769508e-03, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 525, - "real_time": 1.3288359528052667e+06, - "cpu_time": 1.6627989085714577e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.0803188815990051e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 525, - "real_time": 1.3298818930273964e+06, - "cpu_time": 1.6641884857143026e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.0739637830220483e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 525, - "real_time": 1.3295466545969248e+06, - "cpu_time": 1.6636224723809587e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.0759995919475537e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 525, - "real_time": 1.3303332336779151e+06, - "cpu_time": 1.6636852171428646e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.0712245384674939e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 525, - "real_time": 1.3318021806134356e+06, - "cpu_time": 1.6656003752381194e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.0623221648835913e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3300799829441882e+06, - "cpu_time": 1.6639790918095405e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.0727657919839404e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time_median", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3298818930273966e+06, - "cpu_time": 1.6636852171428646e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.0739637830220483e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1069542077389635e+03, - "cpu_time": 1.0342603607063913e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7154042467665088e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.3224634753819378e-04, - "cpu_time": 6.2155850743392206e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.3185916943542956e-04, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2680315770763410e+06, - "cpu_time": 2.5729911585760554e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8059713283533929e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2740981075912714e+06, - "cpu_time": 2.5737956504854579e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8011536029720767e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2757017486171140e+06, - "cpu_time": 2.5751843430420412e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.7998843664329189e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2735860022417838e+06, - "cpu_time": 2.5730049126213281e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8015592970581686e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2752030999746332e+06, - "cpu_time": 2.5741329449837855e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8002788410606806e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2733241071002288e+06, - "cpu_time": 2.5738218019417333e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8017694871754476e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time_median", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2740981075912709e+06, - "cpu_time": 2.5737956504854574e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8011536029720767e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0766188129530628e+03, - "cpu_time": 9.0984733676908240e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4420620679161061e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3533568765421171e-03, - "cpu_time": 3.5350051665685573e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3553687557138156e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2684116403249763e+06, - "cpu_time": 2.5748134498382141e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6113374902389413e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2745501486626738e+06, - "cpu_time": 2.5760704368932624e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6015912882010983e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2748996651336597e+06, - "cpu_time": 2.5757139708737382e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6010379383121873e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2682495615640986e+06, - "cpu_time": 2.5695215113267959e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6115955399330524e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2825760718640001e+06, - "cpu_time": 2.5836251941746674e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.5889274845986795e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2737374175098813e+06, - "cpu_time": 2.5759489126213356e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6028979482567925e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time_median", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2745501486626738e+06, - "cpu_time": 2.5757139708737382e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6015912882010983e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.8867144436449544e+03, - "cpu_time": 5.0397427361914106e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3168506229189461e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5890036370566833e-03, - "cpu_time": 1.9564606702789267e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5859324234889201e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 307, - "real_time": 2.2833339198028324e+06, - "cpu_time": 2.5870899185668044e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1754726095492728e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 307, - "real_time": 2.2775582743183700e+06, - "cpu_time": 2.5882912899022931e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1936688447207436e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 307, - "real_time": 2.2779408279587952e+06, - "cpu_time": 2.5833373029315379e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1924607517927866e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 307, - "real_time": 2.2882855897738994e+06, - "cpu_time": 2.5937527068404406e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1599454513974655e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 307, - "real_time": 2.2774034973039785e+06, - "cpu_time": 2.5822575960911736e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1941577412152058e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2809044218315752e+06, - "cpu_time": 2.5869457628664500e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1831410797350947e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time_median", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2779408279587952e+06, - "cpu_time": 2.5870899185668044e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1924607517927866e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8119685409745498e+03, - "cpu_time": 4.5597587915307004e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5131916286703827e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1096756597589125e-03, - "cpu_time": 1.7626031658577511e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1065876499897274e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 306, - "real_time": 2.2971288641926898e+06, - "cpu_time": 2.6036521568628070e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4264763510129018e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 306, - "real_time": 2.2907236384020913e+06, - "cpu_time": 2.5983501862745751e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4304650046243696e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 306, - "real_time": 2.2990007677839864e+06, - "cpu_time": 2.6062238169934219e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4253148784976343e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 306, - "real_time": 2.2907576210236824e+06, - "cpu_time": 2.6039543921569004e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4304437841554273e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 306, - "real_time": 2.2918268934720093e+06, - "cpu_time": 2.6047866666666949e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4297763977434628e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2938875569748925e+06, - "cpu_time": 2.6033934437908800e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4284952832067592e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time_median", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2918268934720093e+06, - "cpu_time": 2.6039543921569004e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4297763977434628e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8956453612737860e+03, - "cpu_time": 2.9903229066876861e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4242923804883252e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6982721535013870e-03, - "cpu_time": 1.1486250431411498e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6970951244908207e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 298, - "real_time": 2.3222801809967966e+06, - "cpu_time": 2.6377236107383273e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8220539681766506e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 298, - "real_time": 2.3217814093168150e+06, - "cpu_time": 2.6444451241610488e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8226602098293133e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 298, - "real_time": 2.3305841101233489e+06, - "cpu_time": 2.6460582080536918e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8119989197270989e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 298, - "real_time": 2.3217577856009039e+06, - "cpu_time": 2.6436849899329143e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8226889301908102e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 298, - "real_time": 2.3225588574005454e+06, - "cpu_time": 2.6439395033557257e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8217153589532372e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3237924686876819e+06, - "cpu_time": 2.6431702872483418e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8202234773754224e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time_median", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3222801809967966e+06, - "cpu_time": 2.6439395033557257e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8220539681766506e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8118072915578814e+03, - "cpu_time": 3.1815166591042639e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6161639472076815e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6403389471825458e-03, - "cpu_time": 1.2036744943952759e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6368078573346290e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 294, - "real_time": 2.3894181861510486e+06, - "cpu_time": 2.7251249625850408e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4855194774898306e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 294, - "real_time": 2.3812597964377124e+06, - "cpu_time": 2.7215532925170804e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5043133133175753e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 294, - "real_time": 2.3885779011500431e+06, - "cpu_time": 2.7283646802721103e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4874492448788032e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 294, - "real_time": 2.3815912316508945e+06, - "cpu_time": 2.7224424387754519e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5035473030836716e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 294, - "real_time": 2.3812853547484698e+06, - "cpu_time": 2.7202034761904497e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5042542355804674e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3844264940276342e+06, - "cpu_time": 2.7235377700680266e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4970167148700692e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time_median", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3815912316508950e+06, - "cpu_time": 2.7224424387754519e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5035473030836716e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1858276866539218e+03, - "cpu_time": 3.2432105875310035e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6435676337261204e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7554861502916224e-03, - "cpu_time": 1.1908080083097201e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7543275077987572e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 280, - "real_time": 2.4961793678812683e+06, - "cpu_time": 2.8703307785713756e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0501809420150170e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 280, - "real_time": 2.5017519323487901e+06, - "cpu_time": 2.8685279714285424e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0478417008911191e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 280, - "real_time": 2.5021519187638271e+06, - "cpu_time": 2.8670953321428625e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0476741960956179e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 280, - "real_time": 2.4967410543467849e+06, - "cpu_time": 2.8702223178571886e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0499446850670062e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 280, - "real_time": 2.4979193520266563e+06, - "cpu_time": 2.8670293321427819e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0494494139184785e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4989487250734651e+06, - "cpu_time": 2.8686411464285506e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0490181875974478e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time_median", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4979193520266563e+06, - "cpu_time": 2.8685279714285424e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0494494139184785e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8160779021268436e+03, - "cpu_time": 1.6089791433435271e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1818191129568010e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1269050356541650e-03, - "cpu_time": 5.6088547197571275e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1265954460365510e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 270, - "real_time": 2.5956279486072836e+06, - "cpu_time": 3.0303297740740869e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0198888684386113e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 270, - "real_time": 2.5906542954207570e+06, - "cpu_time": 3.0284169000000078e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0237667408064902e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 270, - "real_time": 2.5968776851961459e+06, - "cpu_time": 3.0308198444444132e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0189168053188449e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 270, - "real_time": 2.5918354056085702e+06, - "cpu_time": 3.0311001555556110e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0228445018749011e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 270, - "real_time": 2.5937754850558662e+06, - "cpu_time": 3.0298591518518208e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0213314645801258e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5937541639777245e+06, - "cpu_time": 3.0301051651851879e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0213496762037948e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time_median", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5937754850558657e+06, - "cpu_time": 3.0303297740740869e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0213314645801258e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5767579909166275e+03, - "cpu_time": 1.0561703612773179e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0080996496688106e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.9344726909853616e-04, - "cpu_time": 3.4855897855042559e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9344496071562035e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 255, - "real_time": 2.7617367185360077e+06, - "cpu_time": 3.3359385568627766e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7967992856170899e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 255, - "real_time": 2.7580749042624352e+06, - "cpu_time": 3.3257413450980145e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8018401834536481e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 255, - "real_time": 2.7533614934951649e+06, - "cpu_time": 3.3254944156862851e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8083484587013650e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 255, - "real_time": 2.7576055770338164e+06, - "cpu_time": 3.3249432196078477e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8024872328837085e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 255, - "real_time": 2.7538289325129166e+06, - "cpu_time": 3.3230639882353498e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8077020239712429e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7569215251680678e+06, - "cpu_time": 3.3270363050980549e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8034354369254112e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time_median", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7576055770338168e+06, - "cpu_time": 3.3254944156862851e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8024872328837085e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4359224490492525e+03, - "cpu_time": 5.0858809211479329e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7387755992450204e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2462895362390816e-03, - "cpu_time": 1.5286520659106666e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2459198211277412e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 227, - "real_time": 3.0871477421159786e+06, - "cpu_time": 3.9890835374448635e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7931701855078042e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 227, - "real_time": 3.0905155040372969e+06, - "cpu_time": 3.9882405726873185e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7857676082206488e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 227, - "real_time": 3.0862878349564541e+06, - "cpu_time": 3.9783895418502009e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7950629110054779e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 227, - "real_time": 3.0843953269693819e+06, - "cpu_time": 3.9791659471364915e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7992321920049965e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 227, - "real_time": 3.0869969006808321e+06, - "cpu_time": 3.9818324713657238e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7935021234957397e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0870686617519888e+06, - "cpu_time": 3.9833424140969203e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7933470040469337e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time_median", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0869969006808321e+06, - "cpu_time": 3.9818324713657238e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7935021234957397e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2163333706748595e+03, - "cpu_time": 5.0300646538104784e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8755087414545775e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.1794106756829790e-04, - "cpu_time": 1.2627748586235626e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1768875320959448e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 193, - "real_time": 3.6209996987539562e+06, - "cpu_time": 5.0403765129534798e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1583276301965249e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 193, - "real_time": 3.6146112819023700e+06, - "cpu_time": 5.0320222746113818e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1603748433476193e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 193, - "real_time": 3.6203596340444111e+06, - "cpu_time": 5.0416739015544336e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1585324177627122e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 193, - "real_time": 3.6237942153790607e+06, - "cpu_time": 5.0717535336787906e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1574343769852455e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 193, - "real_time": 3.6224702776076724e+06, - "cpu_time": 5.0438028290155772e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1578573952496233e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6204470215374939e+06, - "cpu_time": 5.0459258103627330e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1585053327083452e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time_median", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6209996987539558e+06, - "cpu_time": 5.0416739015544336e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1583276301965249e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5237131519923955e+03, - "cpu_time": 1.5114232350086266e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1285112896555355e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.7328123599941033e-04, - "cpu_time": 2.9953338432060230e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7410970652790196e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 142, - "real_time": 4.9251851258458383e+06, - "cpu_time": 7.6339570915492484e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7032066380569527e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 142, - "real_time": 4.9338138688513087e+06, - "cpu_time": 7.6326541549296817e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7002279013725820e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 142, - "real_time": 4.9759062649813341e+06, - "cpu_time": 7.7036550704224445e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6858452618040764e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 142, - "real_time": 5.0004009373853328e+06, - "cpu_time": 7.7405190915493928e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6775870785246139e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 142, - "real_time": 4.9794723811021578e+06, - "cpu_time": 7.7186427816900667e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6846379210448124e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9629557156331949e+06, - "cpu_time": 7.6858856380281672e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6903009601606073e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time_median", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9759062649813341e+06, - "cpu_time": 7.7036550704224454e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6858452618040764e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2087872652362323e+04, - "cpu_time": 4.9758823751130301e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0939226777033193e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.4654763191390706e-03, - "cpu_time": 6.4740520604332141e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4717627421768606e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 87, - "real_time": 8.0314165131113995e+06, - "cpu_time": 1.3849660379310342e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0889485650023208e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 87, - "real_time": 8.0344711280502807e+06, - "cpu_time": 1.3843836195402263e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0881543704135900e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 87, - "real_time": 8.0653970590096777e+06, - "cpu_time": 1.3868216954022856e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0801475584216328e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 87, - "real_time": 8.0137482854997972e+06, - "cpu_time": 1.3812025137930969e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0935541524753103e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 87, - "real_time": 8.0297188672783049e+06, - "cpu_time": 1.3839730954023199e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0893902112025852e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0349503705898924e+06, - "cpu_time": 1.3842693924137929e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0880389715030878e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time_median", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0314165131113995e+06, - "cpu_time": 1.3843836195402261e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0889485650023208e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8818977767324181e+04, - "cpu_time": 2.0313880567092219e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8825748215137469e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3421398887797451e-03, - "cpu_time": 1.4674802952675480e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3383542587804263e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52, - "real_time": 1.3636946552791275e+07, - "cpu_time": 2.5078119653846130e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4605531648968678e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52, - "real_time": 1.3616958973356165e+07, - "cpu_time": 2.5039596769231088e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4641648745255680e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52, - "real_time": 1.3674672943754839e+07, - "cpu_time": 2.5113313384615310e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4537648642868757e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52, - "real_time": 1.3637275811141500e+07, - "cpu_time": 2.5090465884615626e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4604937573079228e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52, - "real_time": 1.3615436010205975e+07, - "cpu_time": 2.5009344442307882e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4644405052359676e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3636258058249954e+07, - "cpu_time": 2.5066168026923213e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4606834332506404e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time_median", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3636946552791277e+07, - "cpu_time": 2.5078119653846134e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4605531648968678e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3891555183876579e+04, - "cpu_time": 4.1505612662176623e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3056813214170877e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7520609452988580e-03, - "cpu_time": 1.6558419546855363e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7497908358447990e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 28, - "real_time": 2.4677511371139970e+07, - "cpu_time": 4.7650800678571925e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7194340219606972e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 28, - "real_time": 2.4713819979556970e+07, - "cpu_time": 4.7734160642856896e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7154387324789042e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 28, - "real_time": 2.4691563166145768e+07, - "cpu_time": 4.7706590357143290e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7178864111775622e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 28, - "real_time": 2.4747843388468027e+07, - "cpu_time": 4.7709367000000007e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7117055392095828e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 28, - "real_time": 2.4648060423455067e+07, - "cpu_time": 4.7688743642856322e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7226833611678133e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4695759665753163e+07, - "cpu_time": 4.7697932464285694e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7174296131989121e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time_median", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4691563166145768e+07, - "cpu_time": 4.7706590357143290e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7178864111775622e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7632159409449538e+04, - "cpu_time": 3.0919364075085090e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1399521637429581e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5238308081543216e-03, - "cpu_time": 6.4823279495890675e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5234809187456659e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 16, - "real_time": 4.4865284115076065e+07, - "cpu_time": 8.6854618937499240e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9915720060022726e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 16, - "real_time": 4.4895373983308673e+07, - "cpu_time": 8.6884674687500045e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9895669885699100e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 16, - "real_time": 4.4954963726922870e+07, - "cpu_time": 8.6977562187499300e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9856041885674787e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 16, - "real_time": 4.4884554110467434e+07, - "cpu_time": 8.6879119875000298e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9902876537365303e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 16, - "real_time": 4.4894854305312037e+07, - "cpu_time": 8.6938592187499002e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9896015941434770e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4899006048217423e+07, - "cpu_time": 8.6906913574999586e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9893264862039337e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time_median", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4894854305312037e+07, - "cpu_time": 8.6884674687500045e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9896015941434770e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3569770429439443e+04, - "cpu_time": 4.9991369079356380e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2335637249203348e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.4767290824631139e-04, - "cpu_time": 5.7522890898909277e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4717958551147692e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.5385767742991447e+07, - "cpu_time": 1.6427983112500045e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1437962449196749e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.5537827573716640e+07, - "cpu_time": 1.6440997012499991e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1382075464643040e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.5571028292179108e+07, - "cpu_time": 1.6449612049999729e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1369899527610803e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.4149570204317570e+07, - "cpu_time": 1.6095250350000611e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1899801193069792e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.5408887825906277e+07, - "cpu_time": 1.6413141125000408e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1429452230682015e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5210616327822223e+07, - "cpu_time": 1.6365396730000159e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1503838173040481e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time_median", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5408887825906277e+07, - "cpu_time": 1.6427983112500045e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1429452230682015e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9849236939185741e+05, - "cpu_time": 1.5164372060174409e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2328530546072215e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.0236831416561774e-03, - "cpu_time": 9.2661194289142441e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0875587994798468e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.6324449330568314e+08, - "cpu_time": 3.0626629100000000e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2887535813822737e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6686973348259926e+08, - "cpu_time": 3.1102523375000149e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2173055040924091e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.6362877190113068e+08, - "cpu_time": 3.0655581949999088e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2810300154571424e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.6656213626265526e+08, - "cpu_time": 3.1099767700000316e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2232470358893404e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.6358525678515434e+08, - "cpu_time": 3.0608791125000322e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2819027982766356e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6477807834744453e+08, - "cpu_time": 3.0818658649999976e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2584477870195608e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time_median", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6362877190113068e+08, - "cpu_time": 3.0655581949999088e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2810300154571424e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7785876079481896e+06, - "cpu_time": 2.5841595166380615e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5036823810129821e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0793836326928940e-02, - "cpu_time": 8.3850486355870751e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0752611703555123e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.1889098882675171e+08, - "cpu_time": 5.5907886150001216e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3671124667098904e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.1768803298473358e+08, - "cpu_time": 5.5810186300001872e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3798623571432996e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.1648266315460205e+08, - "cpu_time": 5.5795526299999666e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3927350499938006e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.1766185164451599e+08, - "cpu_time": 5.5723149450000167e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3801409216791511e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.1792633235454559e+08, - "cpu_time": 5.5693684150000417e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3773290058987088e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1772997379302979e+08, - "cpu_time": 5.5786086470000672e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3794359602849703e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time_median", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1768803298473358e+08, - "cpu_time": 5.5795526299999666e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3798623571432996e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5858838805798313e+05, - "cpu_time": 8.3672473779027432e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1358130809600092e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7022580772227359e-03, - "cpu_time": 1.4998806884226024e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7033544024280412e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2709321194482083e+06, - "cpu_time": 2.5784677508090972e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8036646559894744e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2674260893083122e+06, - "cpu_time": 2.5753592912622206e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8064535904010446e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2674043433782929e+06, - "cpu_time": 2.5878532880258933e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8064709155038539e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2676870706084282e+06, - "cpu_time": 2.5751703624594640e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8062456910781031e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2676606386791444e+06, - "cpu_time": 2.5813569190939404e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8062667447391148e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2682220522844773e+06, - "cpu_time": 2.5796415223301230e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8058203195423183e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time_median", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2676606386791440e+06, - "cpu_time": 2.5784677508090972e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8062667447391148e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5205311223442145e+03, - "cpu_time": 5.2460031210936768e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2094863406636525e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.7036255150274482e-04, - "cpu_time": 2.0336171036489975e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6977114365962748e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 308, - "real_time": 2.2689748106391304e+06, - "cpu_time": 2.5794901850648466e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6104411391382781e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 308, - "real_time": 2.2689161161505072e+06, - "cpu_time": 2.5851680779222110e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6105345374771836e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 308, - "real_time": 2.2754060269285040e+06, - "cpu_time": 2.5853904772728872e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6002365745062702e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 308, - "real_time": 2.2756169125280501e+06, - "cpu_time": 2.5860859383116476e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.5999029339693496e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 308, - "real_time": 2.2683794883853914e+06, - "cpu_time": 2.5852130681817634e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6113886772230426e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2714586709263166e+06, - "cpu_time": 2.5842695493506715e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6065007724628248e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time_median", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2689748106391300e+06, - "cpu_time": 2.5852130681817634e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6104411391382781e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7076982233911926e+03, - "cpu_time": 2.6970193090661255e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8834728582305161e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6322983424035479e-03, - "cpu_time": 1.0436292567637861e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6313521691589106e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 307, - "real_time": 2.2752644207498441e+06, - "cpu_time": 2.5944403224755079e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2009212865906954e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 307, - "real_time": 2.2753467661986910e+06, - "cpu_time": 2.5940793550487766e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2006606831942089e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 307, - "real_time": 2.2811812943254113e+06, - "cpu_time": 2.5945149902280071e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1822437088872669e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 307, - "real_time": 2.2813829908857322e+06, - "cpu_time": 2.5937236677524163e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1816087283262415e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 307, - "real_time": 2.2752435539670121e+06, - "cpu_time": 2.5961047882737350e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2009873278988516e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2776838052253383e+06, - "cpu_time": 2.5945726247556889e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1932843469794532e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time_median", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2753467661986910e+06, - "cpu_time": 2.5944403224755083e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2006606831942089e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2858181404463676e+03, - "cpu_time": 9.1274225248292601e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0371654376325559e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4426138223875599e-03, - "cpu_time": 3.5178905526642260e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4418524106697857e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 306, - "real_time": 2.2892185906861341e+06, - "cpu_time": 2.6125719281045566e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4314054644374803e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 306, - "real_time": 2.2951763083707858e+06, - "cpu_time": 2.6128547483660239e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4276898851077862e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 306, - "real_time": 2.2895574551440920e+06, - "cpu_time": 2.6127773464051401e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4311936102052422e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 306, - "real_time": 2.2895705667050444e+06, - "cpu_time": 2.6121787026143917e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4311854142655633e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 306, - "real_time": 2.2964437600237383e+06, - "cpu_time": 2.6142740555556454e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4269019154930785e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2919933361859592e+06, - "cpu_time": 2.6129313562091524e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4296752579018302e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time_median", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2895705667050448e+06, - "cpu_time": 2.6127773464051401e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4311854142655633e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5156836199250115e+03, - "cpu_time": 7.9500083418544511e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1916154922831753e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5338978366208345e-03, - "cpu_time": 3.0425630290526829e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5329463667851095e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 301, - "real_time": 2.3267314911656007e+06, - "cpu_time": 2.6616241362126777e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8166550480291583e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 301, - "real_time": 2.3273220394066600e+06, - "cpu_time": 2.6585244285714198e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8159403335822016e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 301, - "real_time": 2.3278844623247851e+06, - "cpu_time": 2.6605173089700826e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8152599951009281e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 301, - "real_time": 2.3275453270880189e+06, - "cpu_time": 2.6591571860464993e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8156701928547092e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 301, - "real_time": 2.3274682400333523e+06, - "cpu_time": 2.6525971362127354e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8157634494321123e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3273903120036838e+06, - "cpu_time": 2.6584840392026836e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8158578037998226e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time_median", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3274682400333527e+06, - "cpu_time": 2.6591571860464998e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8157634494321123e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2219457477477556e+02, - "cpu_time": 3.5037401432479210e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1085354126696629e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8140256604028837e-04, - "cpu_time": 1.3179466536495520e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8142021964944453e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 294, - "real_time": 2.3916324966454082e+06, - "cpu_time": 2.7393071054420881e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4804406690344952e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 294, - "real_time": 2.3829424278620556e+06, - "cpu_time": 2.7351780680271611e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5004266350486726e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 294, - "real_time": 2.3896396001737542e+06, - "cpu_time": 2.7370307993196873e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4850112121706374e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 294, - "real_time": 2.3860901872925209e+06, - "cpu_time": 2.7372723027209463e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4931704047920525e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 294, - "real_time": 2.3853914102628119e+06, - "cpu_time": 2.7320585034013125e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4947795752127349e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3871392244473104e+06, - "cpu_time": 2.7361693557822397e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4907656992517188e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time_median", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3860901872925209e+06, - "cpu_time": 2.7370307993196873e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4931704047920525e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4716641818321768e+03, - "cpu_time": 2.7242342295283224e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.9835433862414749e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4543199434192886e-03, - "cpu_time": 9.9563801625484369e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4539945471229033e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 279, - "real_time": 2.4956063898180122e+06, - "cpu_time": 2.8756287741936329e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0504220580198002e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 279, - "real_time": 2.5071183630135111e+06, - "cpu_time": 2.8829076272400245e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0455988192153306e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 279, - "real_time": 2.4965245420226702e+06, - "cpu_time": 2.8758255125446883e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0500357420384596e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 279, - "real_time": 2.4984915637307698e+06, - "cpu_time": 2.8774234623657195e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0492090660036661e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 279, - "real_time": 2.5003817296289844e+06, - "cpu_time": 2.8763244480285714e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0484159154326323e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4996245176427895e+06, - "cpu_time": 2.8776219648745274e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0487363201419778e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time_median", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4984915637307698e+06, - "cpu_time": 2.8763244480285714e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0492090660036661e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5762941628143399e+03, - "cpu_time": 3.0356724917214965e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9170465142374611e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8307926372597371e-03, - "cpu_time": 1.0549240062719151e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8279585415502074e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 270, - "real_time": 2.5990339203013312e+06, - "cpu_time": 3.0414277962963581e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0172418524619108e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 270, - "real_time": 2.5978795468324311e+06, - "cpu_time": 3.0429885407407391e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0181382182990706e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 270, - "real_time": 2.6038392645272394e+06, - "cpu_time": 3.0506841259260136e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0135190644926053e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 270, - "real_time": 2.5973681394976596e+06, - "cpu_time": 3.0430180740739633e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0185355784852245e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 270, - "real_time": 2.6011607471715519e+06, - "cpu_time": 3.0432662037037937e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0155924641339442e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5998563236660426e+06, - "cpu_time": 3.0442769481481733e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0166054355745512e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time_median", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5990339203013312e+06, - "cpu_time": 3.0430180740739629e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0172418524619108e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6617847858117211e+03, - "cpu_time": 3.6549950500771856e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0634739266586336e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0238199555806043e-03, - "cpu_time": 1.2006118734698267e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0232412797552184e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 253, - "real_time": 2.7588475550793614e+06, - "cpu_time": 3.3445616442686571e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8007754291078854e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 253, - "real_time": 2.7606373076721025e+06, - "cpu_time": 3.3478196521740318e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7983113431304306e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 253, - "real_time": 2.7561547674547895e+06, - "cpu_time": 3.3453019604743882e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8044888203731841e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 253, - "real_time": 2.7624826819411381e+06, - "cpu_time": 3.3522005138341519e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7957740218779868e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 253, - "real_time": 2.7528485207792679e+06, - "cpu_time": 3.3420563122530864e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8090581159299397e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7581941665853322e+06, - "cpu_time": 3.3463880166008631e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8016815460838860e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time_median", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7588475550793614e+06, - "cpu_time": 3.3453019604743887e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8007754291078854e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7921727524655371e+03, - "cpu_time": 3.8442658875658294e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2290708968228765e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3748751985652552e-03, - "cpu_time": 1.1487806759093919e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3754626297432370e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 226, - "real_time": 3.1007014460185855e+06, - "cpu_time": 4.0112318451328310e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7634760602083123e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 226, - "real_time": 3.0998193238556911e+06, - "cpu_time": 4.0068719867256945e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7654007569430542e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 226, - "real_time": 3.1034412960711438e+06, - "cpu_time": 4.0101629469027268e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7575049757020581e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 226, - "real_time": 3.0983297836315711e+06, - "cpu_time": 4.0062753849557173e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7686532630555403e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 226, - "real_time": 3.0961831963612838e+06, - "cpu_time": 4.0101514646017873e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7733459779273665e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0996950091876551e+06, - "cpu_time": 4.0089387256637514e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7656762067672658e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time_median", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0998193238556911e+06, - "cpu_time": 4.0101514646017877e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7654007569430542e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7046120234773662e+03, - "cpu_time": 2.2131789257187966e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9028338211404870e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7254133566714047e-04, - "cpu_time": 5.5206105085888163e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7246767961438444e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 192, - "real_time": 3.6257040034494516e+06, - "cpu_time": 5.0836759218748640e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1568247148718121e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 192, - "real_time": 3.6269573623333904e+06, - "cpu_time": 5.0873872968750792e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1564249537528639e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 192, - "real_time": 3.6237131813929104e+06, - "cpu_time": 5.0828158749999609e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1574602596963155e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 192, - "real_time": 3.6232848360668868e+06, - "cpu_time": 5.0802663645835491e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1575970948375564e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 192, - "real_time": 3.6222656878332295e+06, - "cpu_time": 5.0803838593749264e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1579227923805206e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6243850142151741e+06, - "cpu_time": 5.0829058635416757e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1572459631078138e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time_median", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6237131813929109e+06, - "cpu_time": 5.0828158749999609e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1574602596963155e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9045998956675958e+03, - "cpu_time": 2.9159814917223921e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0803388458210125e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.2549601882735371e-04, - "cpu_time": 5.7368394575983532e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2541456524005548e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 142, - "real_time": 5.0210390849904697e+06, - "cpu_time": 7.8226240845073732e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6706916353382504e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 142, - "real_time": 4.9976057759945244e+06, - "cpu_time": 7.8008837112674778e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6785253531388569e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 142, - "real_time": 5.0027843820534544e+06, - "cpu_time": 7.7348718802814921e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6767878364081709e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 142, - "real_time": 5.0064532617500555e+06, - "cpu_time": 7.7389587112677451e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6755590357928717e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 142, - "real_time": 4.9919404325560788e+06, - "cpu_time": 7.7179774999997718e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6804303082808800e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0039645874689166e+06, - "cpu_time": 7.7630631774647729e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6763988337918060e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time_median", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0027843820534544e+06, - "cpu_time": 7.7389587112677451e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6767878364081709e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1001586645343930e+04, - "cpu_time": 4.5788610114555726e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6811536572547471e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1985740412501010e-03, - "cpu_time": 5.8982658092329443e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1958698509282749e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 87, - "real_time": 7.9278984406813122e+06, - "cpu_time": 1.3470304022988152e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1162248892984293e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 87, - "real_time": 7.8675469180205092e+06, - "cpu_time": 1.3392337609195562e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1324583348301382e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 87, - "real_time": 7.9656272709112745e+06, - "cpu_time": 1.3532880413793426e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1062014866383111e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 87, - "real_time": 7.8963617708576825e+06, - "cpu_time": 1.3445889942529028e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1246767165503998e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 87, - "real_time": 7.9993359776663370e+06, - "cpu_time": 1.3653429620689917e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0973260839200871e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9313540756274220e+06, - "cpu_time": 1.3498968321839217e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1153775022474732e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time_median", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9278984406813113e+06, - "cpu_time": 1.3470304022988152e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1162248892984293e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2687633956274520e+04, - "cpu_time": 1.0002173274009576e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4044583112998405e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.6429557240648817e-03, - "cpu_time": 7.4095834848561170e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6392797966683499e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.3835366669238782e+07, - "cpu_time": 2.5413161098039798e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4252651051601043e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.3824671726016438e+07, - "cpu_time": 2.5360547117646974e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4271413213273215e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3857663298646608e+07, - "cpu_time": 2.5418534745097969e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4213629150072546e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.3742121046080308e+07, - "cpu_time": 2.5126377862746127e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4417214698869791e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.3828533975517049e+07, - "cpu_time": 2.5303910235293768e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4264634312940898e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3817671343099838e+07, - "cpu_time": 2.5324506211764928e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4283908485351501e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time_median", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3828533975517049e+07, - "cpu_time": 2.5360547117646974e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4264634312940898e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4122926577713013e+04, - "cpu_time": 1.2008230278566713e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7804858847555276e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1932244936298025e-03, - "cpu_time": 4.7417431077049340e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2039677177373898e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 27, - "real_time": 2.5038356375363138e+07, - "cpu_time": 4.7366660148148403e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6802423846811590e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 27, - "real_time": 2.5280863253606692e+07, - "cpu_time": 4.8125969444444962e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6545321386691937e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 27, - "real_time": 2.5525201870887369e+07, - "cpu_time": 4.8405420148147486e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6291217730403399e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 27, - "real_time": 2.5477195779482525e+07, - "cpu_time": 4.8371140259260096e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6340757664563928e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 27, - "real_time": 2.5436211860290281e+07, - "cpu_time": 4.8329246518518530e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6383199026882987e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5351565827926002e+07, - "cpu_time": 4.8119687303703897e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6472583931070771e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time_median", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5436211860290281e+07, - "cpu_time": 4.8329246518518522e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6383199026882987e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9760840450731851e+05, - "cpu_time": 4.3470572634333197e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0757325926490627e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.7947218664356855e-03, - "cpu_time": 9.0338435409964002e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8410653000623165e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 4.6046816060940422e+07, - "cpu_time": 8.8338758266669020e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9148101754173455e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 4.5945120354493462e+07, - "cpu_time": 8.8072516666666925e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9212618655568161e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 4.6058953801790871e+07, - "cpu_time": 8.8199142266667739e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9140420465820765e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.7303801029920578e+07, - "cpu_time": 9.0619359866665646e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.8373560914291997e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 4.5932351549466453e+07, - "cpu_time": 8.8254271800000578e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9220739516341848e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6257408559322357e+07, - "cpu_time": 8.8696809773333982e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9019088261239243e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time_median", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6046816060940422e+07, - "cpu_time": 8.8254271800000578e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9148101754173455e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.8776200034892594e+05, - "cpu_time": 1.0790799820762235e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6269435586278431e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2706332210442709e-02, - "cpu_time": 1.2165939055010304e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2498475231120017e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.7924063205718994e+07, - "cpu_time": 1.6732156887499627e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0530374304009609e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.7461424991488457e+07, - "cpu_time": 1.6743349149999887e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0691868561039739e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.8530085049569607e+07, - "cpu_time": 1.6878691362499866e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0321382369586349e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.7657685391604900e+07, - "cpu_time": 1.6705459424999702e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0623151273135080e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.7790005840361118e+07, - "cpu_time": 1.6738151012500423e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0576994890298529e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7872652895748630e+07, - "cpu_time": 1.6759561567499903e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0548754279613862e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time_median", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7790005840361118e+07, - "cpu_time": 1.6738151012500423e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0576994890298529e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0528076986555080e+05, - "cpu_time": 6.8174813369816565e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4040116742534585e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6121376390715384e-03, - "cpu_time": 4.0678160401296532e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5959703017756093e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.7007119208574295e+08, - "cpu_time": 3.1637174875000083e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1567422172788181e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6954314708709717e+08, - "cpu_time": 3.1390990174999446e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1665739442963176e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.7024963721632957e+08, - "cpu_time": 3.1613741175000596e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1534335155018220e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.6989164054393768e+08, - "cpu_time": 3.1412480000000185e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1600784493051820e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.7019000276923180e+08, - "cpu_time": 3.1610953950000465e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1545384761992583e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6998912394046783e+08, - "cpu_time": 3.1533068035000157e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1582733205162797e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time_median", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7007119208574295e+08, - "cpu_time": 3.1610953950000465e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1567422172788181e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8432068934398238e+05, - "cpu_time": 1.2056139296604902e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2885701482650302e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6725816496563322e-03, - "cpu_time": 3.8233321550643850e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6745131315615562e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.2319130003452301e+08, - "cpu_time": 5.6249415499999595e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3223104207486520e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.2354488968849182e+08, - "cpu_time": 5.6422556850000656e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3186795966204128e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.2397209107875824e+08, - "cpu_time": 5.6410475249998629e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3143034649209065e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.2224640250205994e+08, - "cpu_time": 5.6302313300000155e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3320521677294326e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.2512977719306946e+08, - "cpu_time": 5.6622488099998236e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3025022600817881e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2361689209938049e+08, - "cpu_time": 5.6401449799999452e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3179695820202389e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time_median", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2354488968849182e+08, - "cpu_time": 5.6410475249998629e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3186795966204128e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0582464636021932e+06, - "cpu_time": 1.4346373267876832e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0843715741962254e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2700594111051938e-03, - "cpu_time": 2.5436178181144856e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2681781655634567e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2612703115676311e+06, - "cpu_time": 2.5783987831715187e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8113712363562754e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2610875560893016e+06, - "cpu_time": 2.5714699579288736e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8115176429011440e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2737555308297612e+06, - "cpu_time": 2.5835002103559040e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8014249748763654e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2605915107797459e+06, - "cpu_time": 2.5707884530743505e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8119151471940044e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2725284010666185e+06, - "cpu_time": 2.5828387572815497e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8023977161638681e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2658466620666115e+06, - "cpu_time": 2.5773992323624394e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8077253434983315e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time_median", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2612703115676306e+06, - "cpu_time": 2.5783987831715187e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8113712363562754e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6784079280637188e+03, - "cpu_time": 6.0553316122564847e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3222829285842572e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9474227183460600e-03, - "cpu_time": 2.3493960641503644e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9441878146624378e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2627610869970908e+06, - "cpu_time": 2.5745981229774007e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6203557004206749e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2686448552522170e+06, - "cpu_time": 2.5875358996763667e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6109662475527721e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2624390046067028e+06, - "cpu_time": 2.5752819967637444e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6208710967764091e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2682849706593649e+06, - "cpu_time": 2.5807195792879709e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6115391610687603e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2688954473325447e+06, - "cpu_time": 2.5815525372167998e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6105674281426356e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2662050729695838e+06, - "cpu_time": 2.5799376271844562e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6148599267922509e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time_median", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2682849706593649e+06, - "cpu_time": 2.5807195792879704e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6115391610687603e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3000354729551664e+03, - "cpu_time": 5.2711082363669739e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2666749470190953e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4561945484619688e-03, - "cpu_time": 2.0431146012314461e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4569513214008902e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2807137514720745e+06, - "cpu_time": 2.5953531262136633e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1837160579336332e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2684812182590701e+06, - "cpu_time": 2.5846711067961855e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2224534495259272e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2688395295497091e+06, - "cpu_time": 2.5895063365695826e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2213128282596925e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2763999519586372e+06, - "cpu_time": 2.5911296051779934e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.1973292680414282e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2746823964682692e+06, - "cpu_time": 2.5900107993526775e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2027637904255213e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2738233695415519e+06, - "cpu_time": 2.5901341948220204e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2055150788372420e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time_median", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2746823964682692e+06, - "cpu_time": 2.5900107993526771e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2027637904255213e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2017138701465346e+03, - "cpu_time": 3.8237040239401044e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6479166293786868e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2876508086884968e-03, - "cpu_time": 1.4762571111505084e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2870212765478135e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 306, - "real_time": 2.2856059234613688e+06, - "cpu_time": 2.6044336960784541e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4336679680272909e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 306, - "real_time": 2.2942151180377193e+06, - "cpu_time": 2.6139578006537328e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4282880337754473e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 306, - "real_time": 2.2919960030859788e+06, - "cpu_time": 2.6110701601307075e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4296709050050987e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 306, - "real_time": 2.2857669973745942e+06, - "cpu_time": 2.6110155359476511e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4335669400090626e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 306, - "real_time": 2.2857126040274608e+06, - "cpu_time": 2.6103111862745117e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4336010547547527e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2886593291974245e+06, - "cpu_time": 2.6101576758170119e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4317589803143306e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time_median", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2857669973745942e+06, - "cpu_time": 2.6110155359476516e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4335669400090626e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1343754506321611e+03, - "cpu_time": 3.4927428302132366e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5842658030134982e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8064617122732650e-03, - "cpu_time": 1.3381348041052595e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8049586826730743e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 302, - "real_time": 2.3251732006447008e+06, - "cpu_time": 2.6527681225165124e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8185427211112201e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 302, - "real_time": 2.3161888065507375e+06, - "cpu_time": 2.6516630927152927e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8294757238550015e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 302, - "real_time": 2.3155615014326298e+06, - "cpu_time": 2.6435575198676032e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8302422526654165e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 302, - "real_time": 2.3244102616541530e+06, - "cpu_time": 2.6589586754966862e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8194678487334538e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 302, - "real_time": 2.3151954292128514e+06, - "cpu_time": 2.6435538344369647e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8306897626470231e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3193058398990151e+06, - "cpu_time": 2.6501002490066118e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8256836618024230e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time_median", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3161888065507379e+06, - "cpu_time": 2.6516630927152927e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8294757238550015e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0277352512091602e+03, - "cpu_time": 6.5896623151849253e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1206800480012025e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1677758770391720e-03, - "cpu_time": 2.4865709580817012e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1660882039771555e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 289, - "real_time": 2.3932131249006437e+06, - "cpu_time": 2.7504868477508891e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4768210418134645e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 289, - "real_time": 2.3998507060059006e+06, - "cpu_time": 2.7517098754324852e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4616730812453181e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 289, - "real_time": 2.3935060242390758e+06, - "cpu_time": 2.7492958996539069e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4761508294790849e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 289, - "real_time": 2.3989112021330628e+06, - "cpu_time": 2.7465870069202627e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4638120778898969e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 289, - "real_time": 2.3882681258976664e+06, - "cpu_time": 2.7353766020761686e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4881610058223516e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3947498366352702e+06, - "cpu_time": 2.7466912463667430e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4733236072500229e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time_median", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3935060242390758e+06, - "cpu_time": 2.7492958996539069e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4761508294790849e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7237950169392252e+03, - "cpu_time": 6.6032092119889830e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0800203440213522e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9725630396435754e-03, - "cpu_time": 2.4040595100463329e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9732440862636840e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 280, - "real_time": 2.5043751337632006e+06, - "cpu_time": 2.8866171678570495e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0467441417456067e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 280, - "real_time": 2.5026905865940666e+06, - "cpu_time": 2.8889367678571278e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0474486994285381e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 280, - "real_time": 2.5101345980406874e+06, - "cpu_time": 2.8876099607141931e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0443424038082235e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 280, - "real_time": 2.5077174484197581e+06, - "cpu_time": 2.8850166250001462e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0453490291148646e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 280, - "real_time": 2.5088346139195240e+06, - "cpu_time": 2.8906754964284329e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0448835429229644e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5067504761474472e+06, - "cpu_time": 2.8877712035713894e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0457535634040394e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time_median", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5077174484197581e+06, - "cpu_time": 2.8876099607141926e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0453490291148646e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1167250941008542e+03, - "cpu_time": 2.1644258995253886e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3006427858947283e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2433328022703159e-03, - "cpu_time": 7.4951433023799847e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2437373693100287e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 270, - "real_time": 2.5935629736287175e+06, - "cpu_time": 3.0508407555556814e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0214970884877178e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 270, - "real_time": 2.5945751600105455e+06, - "cpu_time": 3.0449419814814334e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0207084692735171e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 270, - "real_time": 2.5927167920464720e+06, - "cpu_time": 3.0461692518517543e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0221568418437684e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 270, - "real_time": 2.5943956303375741e+06, - "cpu_time": 3.0445424518520501e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0208483003487846e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 270, - "real_time": 2.5938912829453195e+06, - "cpu_time": 3.0500270407405538e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0212412272139636e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5938283677937253e+06, - "cpu_time": 3.0473042962962943e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0212903854335505e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time_median", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5938912829453191e+06, - "cpu_time": 3.0461692518517538e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0212412272139636e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3984431303815677e+02, - "cpu_time": 2.9332798758267227e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7661838160086430e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8523256288829095e-04, - "cpu_time": 9.6258187257237233e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8527241100846792e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 254, - "real_time": 2.7560443556904206e+06, - "cpu_time": 3.3461211732284534e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8046412345831776e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 254, - "real_time": 2.7471562438666467e+06, - "cpu_time": 3.3355273385824794e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8169507189154989e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 254, - "real_time": 2.7591060172385117e+06, - "cpu_time": 3.3493157047244078e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8004193874705887e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 254, - "real_time": 2.7475506113108806e+06, - "cpu_time": 3.3360946771652140e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8164028559958541e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 254, - "real_time": 2.7530341882141321e+06, - "cpu_time": 3.3410715944883553e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8088012291638178e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7525782832641182e+06, - "cpu_time": 3.3416260976377823e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8094430852257872e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time_median", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7530341882141321e+06, - "cpu_time": 3.3410715944883553e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8088012291638178e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2323229718701668e+03, - "cpu_time": 6.0711347768977475e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2405083175147313e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9008807137958913e-03, - "cpu_time": 1.8168204938276828e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9006737088672330e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 227, - "real_time": 3.0995650239502150e+06, - "cpu_time": 4.0190401541849999e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7659558157205617e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 227, - "real_time": 3.0905739701709952e+06, - "cpu_time": 4.0085874889869667e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7856392380214369e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 227, - "real_time": 3.0937950713518956e+06, - "cpu_time": 4.0127411806166600e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7785743775317585e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 227, - "real_time": 3.0798074042646107e+06, - "cpu_time": 4.0050127665197491e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8093608616437268e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 227, - "real_time": 3.1237955562081104e+06, - "cpu_time": 4.0384159867841788e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7134739206354308e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0975074051891654e+06, - "cpu_time": 4.0167595154185109e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7706008427105832e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time_median", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0937950713518960e+06, - "cpu_time": 4.0127411806166605e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7785743775317585e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6358825258536157e+04, - "cpu_time": 1.3182556708278475e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5626995243382510e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.2812868925287094e-03, - "cpu_time": 3.2818884619994402e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2620138258097906e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 193, - "real_time": 3.6365197455134108e+06, - "cpu_time": 5.1230571088081682e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1533840852025514e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 193, - "real_time": 3.6342572553536897e+06, - "cpu_time": 5.1187091088083973e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1541021191665215e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 193, - "real_time": 3.6375833303701384e+06, - "cpu_time": 5.1200089481864069e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1530468498087199e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 193, - "real_time": 3.6331853851039018e+06, - "cpu_time": 5.1162124507771414e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1544426048823960e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 193, - "real_time": 3.6439285866935481e+06, - "cpu_time": 5.1290621658032779e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1510390229150608e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6370948606069377e+06, - "cpu_time": 5.1214099564766781e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1532029363950498e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time_median", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6365197455134108e+06, - "cpu_time": 5.1200089481864069e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1533840852025514e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2013442663488895e+03, - "cpu_time": 4.9381394836796935e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3308838302421439e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1551373905182647e-03, - "cpu_time": 9.6421484037511674e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1540759984556841e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 143, - "real_time": 4.8812964924617661e+06, - "cpu_time": 7.5440169860141743e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7185204817930255e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 143, - "real_time": 4.9270823096426632e+06, - "cpu_time": 7.5999528741256539e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7025508146236720e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 143, - "real_time": 4.9150028897748962e+06, - "cpu_time": 7.5854282307692962e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7067351104617953e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 143, - "real_time": 4.8997603500118619e+06, - "cpu_time": 7.5773664755244488e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7120445492767196e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 143, - "real_time": 4.9673108305860236e+06, - "cpu_time": 7.6637619720278839e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6887624483548467e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9180905744954431e+06, - "cpu_time": 7.5941053076922921e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7057226809020119e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time_median", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9150028897748962e+06, - "cpu_time": 7.5854282307692943e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7067351104617953e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2414581247585069e+04, - "cpu_time": 4.4018646771500884e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1208088203964135e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.5908874097770232e-03, - "cpu_time": 5.7964230133750062e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5708736416854874e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 87, - "real_time": 7.8453139519725721e+06, - "cpu_time": 1.3374297000000063e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1385015440690746e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 87, - "real_time": 7.8550922930583190e+06, - "cpu_time": 1.3394036540229607e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1358394496301866e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 87, - "real_time": 8.3859814545032624e+06, - "cpu_time": 1.4155620839080816e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.0006264133807087e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 87, - "real_time": 7.8084438814428346e+06, - "cpu_time": 1.3315029563218897e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1485991645367279e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 87, - "real_time": 7.8409552124553714e+06, - "cpu_time": 1.3366876436781820e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1396903241264997e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9471573586864723e+06, - "cpu_time": 1.3521172075862240e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1126513791486394e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time_median", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8453139519725721e+06, - "cpu_time": 1.3374297000000063e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1385015440690746e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4593442596692540e+05, - "cpu_time": 3.5586614240394632e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2806963018050157e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0946213201392320e-02, - "cpu_time": 2.6319178574705983e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9728976412265535e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.3709847212714307e+07, - "cpu_time": 2.5045532431372344e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4474694341511059e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.3752740004337301e+07, - "cpu_time": 2.5175919470588244e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4398361337026439e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3767447468696857e+07, - "cpu_time": 2.5234762803920291e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4372297098857980e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.3688608036175663e+07, - "cpu_time": 2.5046667725492254e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4512669156223769e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.3729746983039612e+07, - "cpu_time": 2.5136286058822781e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4439220942272182e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3729677940992748e+07, - "cpu_time": 2.5127833698039182e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4439448575178289e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time_median", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3729746983039612e+07, - "cpu_time": 2.5136286058822781e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4439220942272182e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1774186146338248e+04, - "cpu_time": 8.2430169239052091e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6570865425375989e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3142703188594065e-03, - "cpu_time": 3.2804327754479062e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3147357540149942e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 27, - "real_time": 2.5364701739615865e+07, - "cpu_time": 4.8290595777774364e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6457580573551950e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 27, - "real_time": 2.5490669947531488e+07, - "cpu_time": 4.8426734962963231e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6326834146820378e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 27, - "real_time": 2.5361726888351969e+07, - "cpu_time": 4.8279583259260207e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6460683965026641e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 27, - "real_time": 2.5372405570966225e+07, - "cpu_time": 4.8275255851851597e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6449547250179944e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 27, - "real_time": 2.5364382123505626e+07, - "cpu_time": 4.8294196259260185e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6457913965035644e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5390777253994234e+07, - "cpu_time": 4.8313273222221918e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6430511980122914e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time_median", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5364701739615865e+07, - "cpu_time": 4.8290595777774356e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6457580573551950e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5983542374106066e+04, - "cpu_time": 6.3898547850072362e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8106283705637204e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2048770628043403e-03, - "cpu_time": 1.3225878436380072e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1984547158729302e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 4.7526455670595169e+07, - "cpu_time": 9.1149256933332860e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.8240634843519607e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 4.5911441991726555e+07, - "cpu_time": 8.7983553066669628e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9234047587567959e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 4.5887942612171173e+07, - "cpu_time": 8.8038862799999163e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9249018447909346e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.6011464297771454e+07, - "cpu_time": 8.8095437733333409e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9170496972534037e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 4.5901159942150116e+07, - "cpu_time": 8.8070021333328441e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9240596135077310e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6247692902882889e+07, - "cpu_time": 8.8667426373332709e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9026958797321653e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time_median", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5911441991726555e+07, - "cpu_time": 8.8070021333328441e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9234047587567959e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1652079693383467e+05, - "cpu_time": 1.3880131105236006e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4066589827596143e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5493114401154695e-02, - "cpu_time": 1.5654149074761623e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5181263092453975e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.8269122876226902e+07, - "cpu_time": 1.6871745199999565e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0411025651224232e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.7265998125076294e+07, - "cpu_time": 1.6666431049999630e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0760601123848696e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.7319738231599331e+07, - "cpu_time": 1.6675363062499571e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0741669802997460e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.7192459963262081e+07, - "cpu_time": 1.6672735999999589e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0786544629329572e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.8222160935401917e+07, - "cpu_time": 1.6891340462500182e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0427213882978220e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7653896026313305e+07, - "cpu_time": 1.6755523154999706e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0625411018075638e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time_median", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7319738231599331e+07, - "cpu_time": 1.6675363062499571e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0741669802997460e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4232797677908815e+05, - "cpu_time": 1.1529382181718603e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8907650589604199e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.1871519848505502e-03, - "cpu_time": 6.8809443161303701e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1738438639875179e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.6903428733348846e+08, - "cpu_time": 3.1337246850000608e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1761065785476122e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6934141516685486e+08, - "cpu_time": 3.1548225725001091e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1703461995461202e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.6897445172071457e+08, - "cpu_time": 3.1329356775000858e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1772312709577799e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.7011498659849167e+08, - "cpu_time": 3.1617478425002331e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1559295435100732e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.6832885146141052e+08, - "cpu_time": 3.1236108050001121e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1894170686661992e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6915879845619202e+08, - "cpu_time": 3.1413683165001202e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1738061322455573e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time_median", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6903428733348846e+08, - "cpu_time": 3.1337246850000608e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1761065785476122e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4921941190453083e+05, - "cpu_time": 1.6133860373357858e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2168283808708604e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8379287263184403e-03, - "cpu_time": 5.1359340095888557e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8339719887361869e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.2319359481334686e+08, - "cpu_time": 5.6348445849999964e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3222868312724924e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.2153756916522980e+08, - "cpu_time": 5.6302530700003219e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3393977157556725e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.2895754277706146e+08, - "cpu_time": 5.7048785050000107e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2640741870074339e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.2335719466209412e+08, - "cpu_time": 5.6419135449999654e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3206059482364459e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.2496936619281769e+08, - "cpu_time": 5.6674568300002193e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3041324374030528e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2440305352211004e+08, - "cpu_time": 5.6558693070001030e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3100994239350200e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time_median", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2335719466209412e+08, - "cpu_time": 5.6419135449999654e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3206059482364459e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8209791800556527e+06, - "cpu_time": 3.0940127682568575e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8597365335876659e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.6959082210469590e-03, - "cpu_time": 5.4704460098246770e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6394279063316884e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1, - "real_time": 1.0666832923889160e+09, - "cpu_time": 3.1681850000495613e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.8399401483327874e+03, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1, - "real_time": 2.2102529183030128e+06, - "cpu_time": 2.4357109999755267e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8531815821081803e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1, - "real_time": 2.2384119220077991e+06, - "cpu_time": 2.3678329999938798e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8298687385143978e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1, - "real_time": 2.2441721521317959e+06, - "cpu_time": 2.3679939999965429e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8251719219085337e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1, - "real_time": 2.2403318434953690e+06, - "cpu_time": 2.3630349999166355e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8283005760474373e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1512329224497080e+08, - "cpu_time": 2.5405515999864293e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.4680725517453765e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time_median", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2403318434953690e+06, - "cpu_time": 2.3679939999965425e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8283005760474373e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7603651200075901e+08, - "cpu_time": 3.5214883915875846e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1860655637420993e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2128543452127643e+00, - "cpu_time": 1.3861117371544018e-01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5760633587282649e-01, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 310, - "real_time": 2.2612638816597960e+06, - "cpu_time": 2.5824613677418861e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6227527739871601e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 310, - "real_time": 2.2549598763186126e+06, - "cpu_time": 2.5760325096774567e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6328806051192544e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 310, - "real_time": 2.2557531708791372e+06, - "cpu_time": 2.5823733741936674e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6316030077028875e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 310, - "real_time": 2.2592329217361347e+06, - "cpu_time": 2.5802695838709981e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6260094836546378e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 310, - "real_time": 2.2596122681974405e+06, - "cpu_time": 2.5803090419352031e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6254007447636141e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2581644237582246e+06, - "cpu_time": 2.5802891754838424e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6277293230455108e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time_median", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2592329217361347e+06, - "cpu_time": 2.5803090419352031e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6260094836546378e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6892306272918804e+03, - "cpu_time": 2.6068316859330512e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3210908549529267e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1908923012861217e-03, - "cpu_time": 1.0102866417847263e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1911282430865963e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 309, - "real_time": 2.2690163617863241e+06, - "cpu_time": 2.5927742686086060e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2207500465538297e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 309, - "real_time": 2.2694684081322071e+06, - "cpu_time": 2.5934217961165342e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2193117741983375e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 309, - "real_time": 2.2675230455642091e+06, - "cpu_time": 2.5914459482199098e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2255053954361491e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 309, - "real_time": 2.2694580498058046e+06, - "cpu_time": 2.5995995728155035e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2193447247909969e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 309, - "real_time": 2.2637793217095453e+06, - "cpu_time": 2.5925190355986701e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2374545711581297e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2678490373996180e+06, - "cpu_time": 2.5939521242718445e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2244733024274893e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time_median", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2690163617863236e+06, - "cpu_time": 2.5927742686086055e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2207500465538297e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4105385908951885e+03, - "cpu_time": 3.2363918382146721e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.6874064279112126e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0629184531873350e-03, - "cpu_time": 1.2476683004021012e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0640784602703388e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 307, - "real_time": 2.2834224538446832e+06, - "cpu_time": 2.6142808436485208e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4350388796793735e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 307, - "real_time": 2.2843355663327035e+06, - "cpu_time": 2.6203602638435992e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4344652547088822e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 307, - "real_time": 2.2851037633596202e+06, - "cpu_time": 2.6152618469057339e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4339830219273552e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 307, - "real_time": 2.2790763862370378e+06, - "cpu_time": 2.6146607719873106e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4377754162993610e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 307, - "real_time": 2.2790227168776602e+06, - "cpu_time": 2.6094887296417537e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4378092748848632e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2821921773303412e+06, - "cpu_time": 2.6148104912053840e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4358143694999672e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time_median", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2834224538446832e+06, - "cpu_time": 2.6146607719873106e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4350388796793735e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9299600516175624e+03, - "cpu_time": 3.8609515285001121e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8439550669857712e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2838358139694293e-03, - "cpu_time": 1.4765703065235439e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2842572871226675e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 299, - "real_time": 2.3308573921450903e+06, - "cpu_time": 2.6749481337792925e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8116692261334427e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 299, - "real_time": 2.3292841570433169e+06, - "cpu_time": 2.6685870033445838e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8135682716868818e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 299, - "real_time": 2.3267835403565182e+06, - "cpu_time": 2.6666190301006264e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8165920406140719e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 299, - "real_time": 2.3201116349822204e+06, - "cpu_time": 2.6600519866221314e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8246916662052006e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 299, - "real_time": 2.3291771351531097e+06, - "cpu_time": 2.6687138361202441e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8136975505597152e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3272427719360511e+06, - "cpu_time": 2.6677839979933756e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8160437510398626e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time_median", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3291771351531101e+06, - "cpu_time": 2.6685870033445833e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8136975505597152e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2437748929007503e+03, - "cpu_time": 5.3379632849713180e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1443216518616427e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8235204956165022e-03, - "cpu_time": 2.0008978571677350e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8267903863219566e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 293, - "real_time": 2.4019036062201643e+06, - "cpu_time": 2.7640984982935875e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4570050047206439e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 293, - "real_time": 2.3998956596510606e+06, - "cpu_time": 2.7627524573379676e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4615707759168819e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 293, - "real_time": 2.3922330736414664e+06, - "cpu_time": 2.7556444846414886e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4790647886362381e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 293, - "real_time": 2.3928212125884183e+06, - "cpu_time": 2.7562667372016772e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4777180723090351e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 293, - "real_time": 2.3966721678629466e+06, - "cpu_time": 2.7634413651875900e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4689165150556937e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3967051439928114e+06, - "cpu_time": 2.7604407085324624e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4688550313276984e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time_median", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3966721678629471e+06, - "cpu_time": 2.7627524573379671e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4689165150556937e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2511417143898943e+03, - "cpu_time": 4.1277520856004703e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6989680829972829e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7737441441410136e-03, - "cpu_time": 1.4953235810650372e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7734915311226711e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 280, - "real_time": 2.5054021896461821e+06, - "cpu_time": 2.9014373714285768e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0463150430830447e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 280, - "real_time": 2.5087285188159770e+06, - "cpu_time": 2.9003468928570850e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0449277314538674e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 280, - "real_time": 2.5023141884178454e+06, - "cpu_time": 2.8976413178570839e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0476062566937187e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 280, - "real_time": 2.5094422154195076e+06, - "cpu_time": 2.9088944000002518e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0446305493277794e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 280, - "real_time": 2.5035233976918138e+06, - "cpu_time": 2.8955845285716057e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0471002597446871e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5058821019982654e+06, - "cpu_time": 2.9007809021429205e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0461159680606195e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time_median", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5054021896461821e+06, - "cpu_time": 2.9003468928570850e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0463150430830447e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1344977848358317e+03, - "cpu_time": 5.0820136572175006e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3084147124478538e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2508560487886839e-03, - "cpu_time": 1.7519467442243630e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2507358193504172e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 268, - "real_time": 2.6073920967946970e+06, - "cpu_time": 3.0695197723881435e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0107754435725814e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 268, - "real_time": 2.6064995752730919e+06, - "cpu_time": 3.0708841902986448e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0114639763371858e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 268, - "real_time": 2.6096195675807991e+06, - "cpu_time": 3.0689331865674835e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0090591230737582e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 268, - "real_time": 2.6074900394375087e+06, - "cpu_time": 3.0703626567164734e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0106999147467506e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 268, - "real_time": 2.6091538837054437e+06, - "cpu_time": 3.0680603432838768e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0094177015555003e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6080310325583080e+06, - "cpu_time": 3.0695520298509244e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0102832318571553e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time_median", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6074900394375087e+06, - "cpu_time": 3.0695197723881430e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0106999147467506e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3067624201571648e+03, - "cpu_time": 1.1225978511694987e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0071791732358250e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.0105324815683504e-04, - "cpu_time": 3.6572041791518958e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0101356727995242e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 251, - "real_time": 2.7789130159449647e+06, - "cpu_time": 3.3766341035856837e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7733314932257187e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 251, - "real_time": 2.7843664281545170e+06, - "cpu_time": 3.3834588127489276e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7659411110447776e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 251, - "real_time": 2.7819440720521240e+06, - "cpu_time": 3.3774589920319133e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7692202748939854e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 251, - "real_time": 2.7851434600765845e+06, - "cpu_time": 3.3872485657368260e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7648904447139931e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 251, - "real_time": 2.7794746303582098e+06, - "cpu_time": 3.3754256175296474e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7725690623226267e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7819683213172806e+06, - "cpu_time": 3.3800452183265993e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7691904772402203e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time_median", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7819440720521240e+06, - "cpu_time": 3.3774589920319133e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.7692202748939854e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8011781486429950e+03, - "cpu_time": 5.0795133265442510e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7951415931424743e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0069051208018856e-03, - "cpu_time": 1.5027944889622002e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0068850635325957e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 226, - "real_time": 3.0977783191009564e+06, - "cpu_time": 3.9744891902655903e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7698582144142568e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 226, - "real_time": 3.0999326577772740e+06, - "cpu_time": 3.9765573141592909e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7651534130541670e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 226, - "real_time": 3.0973818332401919e+06, - "cpu_time": 3.9735857256635958e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7707248021344376e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 226, - "real_time": 3.1008884409623863e+06, - "cpu_time": 3.9777797876105770e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7630681978005362e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 226, - "real_time": 3.0967687571882806e+06, - "cpu_time": 3.9740633451331235e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7720652216348076e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0985500016538179e+06, - "cpu_time": 3.9752950725664357e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7681739698076415e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time_median", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0977783191009564e+06, - "cpu_time": 3.9744891902655908e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7698582144142568e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7686845113312745e+03, - "cpu_time": 1.7927303391437297e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8625748251652031e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.7081038240056092e-04, - "cpu_time": 4.5096786689254487e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7069674071557317e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 186, - "real_time": 3.7568463300484964e+06, - "cpu_time": 5.2278669623653451e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1164427904470227e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 186, - "real_time": 3.7763311367441891e+06, - "cpu_time": 5.2467479892470688e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1106822596114204e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 186, - "real_time": 3.7599689394776379e+06, - "cpu_time": 5.2323836720429473e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1155155980045683e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 186, - "real_time": 3.7430793495087693e+06, - "cpu_time": 5.2167813817202849e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1205490475510352e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 186, - "real_time": 3.7434096773585645e+06, - "cpu_time": 5.2152901397852069e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1204501674953187e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7559270866275318e+06, - "cpu_time": 5.2278140290321717e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1167279726218729e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time_median", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7568463300484968e+06, - "cpu_time": 5.2278669623653460e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1164427904470227e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3740967287380223e+04, - "cpu_time": 1.2825232913702308e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0791290486475173e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.6584755162854645e-03, - "cpu_time": 2.4532687739997235e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6527508477023898e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 135, - "real_time": 5.1696518436074257e+06, - "cpu_time": 7.9167009407405602e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6226640117695742e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 135, - "real_time": 5.1628927182820104e+06, - "cpu_time": 7.9120605333333444e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6247883614345891e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 135, - "real_time": 5.2378739471788760e+06, - "cpu_time": 7.9831433185181264e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6015291861916823e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 135, - "real_time": 5.2128687362979958e+06, - "cpu_time": 7.9638144000000460e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6092114389124839e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 135, - "real_time": 5.2061913224558039e+06, - "cpu_time": 7.9659328000001628e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6112753989307916e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1978957135644229e+06, - "cpu_time": 7.9483303985184459e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6138936794478245e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time_median", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2061913224558029e+06, - "cpu_time": 7.9638144000000460e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6112753989307916e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1281758136626326e+04, - "cpu_time": 3.1927511485669074e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7117491653604805e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.0181580894348241e-03, - "cpu_time": 4.0168827772459363e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0175891937833516e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 83, - "real_time": 8.3994057859821487e+06, - "cpu_time": 1.3921480048192147e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.9974289166978526e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 83, - "real_time": 8.4042828866695780e+06, - "cpu_time": 1.3912244385541689e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.9962697860410099e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 83, - "real_time": 8.4093972053154409e+06, - "cpu_time": 1.3919124783132775e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.9950557204499032e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 83, - "real_time": 8.3998279556272980e+06, - "cpu_time": 1.3904219927709790e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.9973285272778044e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 83, - "real_time": 8.4031263747847229e+06, - "cpu_time": 1.3907753084337734e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.9965445301814601e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4032080416758396e+06, - "cpu_time": 1.3912964445782825e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.9965254961296060e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time_median", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4031263747847229e+06, - "cpu_time": 1.3912244385541689e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.9965445301814601e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0419623280579531e+03, - "cpu_time": 7.3247629996794685e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6008049729176355e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.8100229198322591e-04, - "cpu_time": 5.2647033119528205e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8087565080082460e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 48, - "real_time": 1.4458232268225402e+07, - "cpu_time": 2.5229359333335329e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3207838536210251e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 48, - "real_time": 1.4469239026463280e+07, - "cpu_time": 2.5231812895832207e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3190184320427055e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 48, - "real_time": 1.4457052418341240e+07, - "cpu_time": 2.5279500270833921e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3209732543703361e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 48, - "real_time": 1.4462409094752124e+07, - "cpu_time": 2.5231539687498618e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3201135979603615e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 48, - "real_time": 1.4443018900540968e+07, - "cpu_time": 2.5210551958333362e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3232284213616314e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4457990341664603e+07, - "cpu_time": 2.5236552829166692e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3208235118712120e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time_median", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4458232268225402e+07, - "cpu_time": 2.5231539687498622e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.3207838536210251e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6325044292365710e+03, - "cpu_time": 2.5592347336368330e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5467608249499986e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.6624089528389760e-04, - "cpu_time": 1.0140983798227164e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6647068035901214e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 26, - "real_time": 2.6540717396598596e+07, - "cpu_time": 4.8456087807695583e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5285248698138256e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 26, - "real_time": 2.6534052494053658e+07, - "cpu_time": 4.8429097115383856e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5291599922416396e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 26, - "real_time": 2.6399233091909152e+07, - "cpu_time": 4.8192482846152768e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5420762704113383e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 26, - "real_time": 2.7032929400985058e+07, - "cpu_time": 4.8453032115385383e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.4824858232920403e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 26, - "real_time": 2.6446193743210573e+07, - "cpu_time": 4.8381510153844304e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5375622916333127e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6590625225351412e+07, - "cpu_time": 4.8382442007692382e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5239618494784312e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time_median", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6534052494053654e+07, - "cpu_time": 4.8429097115383863e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.5291599922416396e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5436963795677113e+05, - "cpu_time": 1.1030493828377151e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3880990680502348e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.5661397880278509e-03, - "cpu_time": 2.2798547098187810e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4617082605417662e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 14, - "real_time": 4.9852250143885612e+07, - "cpu_time": 9.1031877714288250e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.6923103292753143e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 14, - "real_time": 4.9656019679137640e+07, - "cpu_time": 9.0898268428572580e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.7029497907257743e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 14, - "real_time": 4.9459641267146386e+07, - "cpu_time": 9.0683224785720989e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.7136817931017680e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 14, - "real_time": 4.9615847479019843e+07, - "cpu_time": 9.0811758928566620e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.7051382737492132e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 14, - "real_time": 4.9564088029520854e+07, - "cpu_time": 9.0839077357145458e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.7079632317668920e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9629569319742069e+07, - "cpu_time": 9.0852841442858800e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.7044086837237926e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time_median", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9615847479019850e+07, - "cpu_time": 9.0839077357145458e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.7051382737492132e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4460117763481213e+05, - "cpu_time": 1.2724448016099671e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8685484695056686e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9136093586307121e-03, - "cpu_time": 1.4005558674906845e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9095264028923306e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7, - "real_time": 9.5738101218427926e+07, - "cpu_time": 1.7366462157143098e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.8038518895163841e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7, - "real_time": 9.5605049814496726e+07, - "cpu_time": 1.7335193771428490e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.8077539473160419e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7, - "real_time": 9.5439584127494261e+07, - "cpu_time": 1.7348835228571197e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.8126218115264087e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7, - "real_time": 9.6421739884785250e+07, - "cpu_time": 1.7393116314285961e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.7839723315587821e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7, - "real_time": 9.5554738172463015e+07, - "cpu_time": 1.7356145085713187e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.8092322906637173e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5751842643533438e+07, - "cpu_time": 1.7359950511428386e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.8034864541162672e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time_median", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5605049814496726e+07, - "cpu_time": 1.7356145085713187e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.8077539473160419e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8950443790964299e+05, - "cpu_time": 2.1756027682302037e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1353583278679907e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.0678531833554018e-03, - "cpu_time": 1.2532309736700933e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0498085025557420e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.8570537865161896e+08, - "cpu_time": 3.2938602275001472e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8909820270050621e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8775499239563942e+08, - "cpu_time": 3.3326025549999374e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8594228315841508e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.8552822247147560e+08, - "cpu_time": 3.2957910950000268e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8937425522014165e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8765056133270264e+08, - "cpu_time": 3.3354922750001490e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8610141541124039e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8545182049274445e+08, - "cpu_time": 3.2938573475001931e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8949347090448451e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8641819506883621e+08, - "cpu_time": 3.3103207000000912e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8800192547895756e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time_median", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8570537865161896e+08, - "cpu_time": 3.2957910950000268e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 2.8909820270050621e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1768381357778036e+06, - "cpu_time": 2.1697855897042407e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8141034581549089e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.3128930914884565e-03, - "cpu_time": 6.5546084091012103e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2989282281289945e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.6258032917976379e+08, - "cpu_time": 6.0426293399996209e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9613901736727953e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.6143581569194794e+08, - "cpu_time": 6.0432767550003064e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9707676366947293e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.6135415732860565e+08, - "cpu_time": 6.0327049649998796e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9714389670728717e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.6245046555995941e+08, - "cpu_time": 6.0458062499998271e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9624512203099189e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.6057326197624207e+08, - "cpu_time": 6.0271329649998510e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9778742275980191e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6167880594730377e+08, - "cpu_time": 6.0383100549998975e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9687844450696673e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time_median", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6143581569194794e+08, - "cpu_time": 6.0426293399996209e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 2.9707676366947293e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3589340801579633e+05, - "cpu_time": 7.9978379267321900e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8627375703402795e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3111484396395213e-03, - "cpu_time": 1.3245159413617302e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3116321502348867e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 311, - "real_time": 2.2481399164550076e+06, - "cpu_time": 2.5754388842441528e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8219506579727479e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 311, - "real_time": 2.2596620214905385e+06, - "cpu_time": 2.5861996302250880e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8126604603011205e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 311, - "real_time": 2.2484578575543654e+06, - "cpu_time": 2.5752929549839660e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8216930267286377e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 311, - "real_time": 2.2478554108841913e+06, - "cpu_time": 2.5860079453374185e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8221812578189105e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 311, - "real_time": 2.2477700226787492e+06, - "cpu_time": 2.5750290482314806e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8222504787739131e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2503770458125705e+06, - "cpu_time": 2.5795936926044207e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8201471763190657e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time_median", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2481399164550076e+06, - "cpu_time": 2.5754388842441528e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8219506579727479e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1974517074072555e+03, - "cpu_time": 5.9450778971183618e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1908974297982813e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3095915047118471e-03, - "cpu_time": 2.3046567039462966e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3025047008965781e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 311, - "real_time": 2.2459848270335286e+06, - "cpu_time": 2.5894702347265924e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6473977479268643e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 311, - "real_time": 2.2475328401234183e+06, - "cpu_time": 2.5760320932475580e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6448855624063564e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 311, - "real_time": 2.2513224740312030e+06, - "cpu_time": 2.5886783601284698e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6387501544065606e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 311, - "real_time": 2.2476028165872842e+06, - "cpu_time": 2.5762221543410071e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6447720831915364e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 311, - "real_time": 2.2516573563673296e+06, - "cpu_time": 2.5891986302251648e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6382089738628855e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2488200628285529e+06, - "cpu_time": 2.5839202945337584e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6428029043588410e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time_median", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2476028165872837e+06, - "cpu_time": 2.5886783601284693e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6447720831915364e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5243558172348635e+03, - "cpu_time": 7.1201638670991015e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0882972252100453e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1225245892104608e-03, - "cpu_time": 2.7555663702791811e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1222943795059959e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 310, - "real_time": 2.2566518468421795e+06, - "cpu_time": 2.5892057387097576e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2603135583039839e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 310, - "real_time": 2.2636918884311472e+06, - "cpu_time": 2.6019765096774087e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2377341120195203e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 310, - "real_time": 2.2562121296481742e+06, - "cpu_time": 2.5889537161289458e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2617285337238498e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 310, - "real_time": 2.2659370690704351e+06, - "cpu_time": 2.5996156290320428e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2305626769772889e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 310, - "real_time": 2.2589011741201244e+06, - "cpu_time": 2.5916725290321372e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2530840161176203e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2602788216224117e+06, - "cpu_time": 2.5942848245160584e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2486845794284530e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time_median", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2589011741201240e+06, - "cpu_time": 2.5916725290321368e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2530840161176203e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3375001882808920e+03, - "cpu_time": 6.0955191405607320e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3901879561827693e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9190111179148534e-03, - "cpu_time": 2.3495951882221721e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9178485985279047e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 308, - "real_time": 2.2803527823129259e+06, - "cpu_time": 2.6251919837663574e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4369706413041905e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 308, - "real_time": 2.2735797676148931e+06, - "cpu_time": 2.6120555162338275e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4412513898456873e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 308, - "real_time": 2.2736031391246654e+06, - "cpu_time": 2.6182598831168250e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4412365744980296e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 308, - "real_time": 2.2817413759562974e+06, - "cpu_time": 2.6204818084414904e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4360961476743460e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 308, - "real_time": 2.2734093627977101e+06, - "cpu_time": 2.6127002954544346e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4413594197428193e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2765372855612980e+06, - "cpu_time": 2.6177378974025869e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4393828346130146e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time_median", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2736031391246654e+06, - "cpu_time": 2.6182598831168250e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4412365744980296e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1467035351241557e+03, - "cpu_time": 5.5007228963586031e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6199106180334427e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8214959892922436e-03, - "cpu_time": 2.1013268371201780e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8201624717428418e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 301, - "real_time": 2.3001083087770152e+06, - "cpu_time": 2.6477229435214633e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8492571306281652e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 301, - "real_time": 2.3005016610657554e+06, - "cpu_time": 2.6532658305649967e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8487699491440088e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 301, - "real_time": 2.3079302797768498e+06, - "cpu_time": 2.6540371794020082e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8396005102171704e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 301, - "real_time": 2.3008004083078466e+06, - "cpu_time": 2.6463427275748504e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8484000508414067e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 301, - "real_time": 2.3006090470450465e+06, - "cpu_time": 2.6582485083057070e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8486369765508793e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3019899409945030e+06, - "cpu_time": 2.6519234378738059e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8469329234763265e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time_median", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3006090470450465e+06, - "cpu_time": 2.6532658305649967e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8486369765508793e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3303527554815132e+03, - "cpu_time": 4.8750619892578407e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1108741763461941e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4467277620000103e-03, - "cpu_time": 1.8383117399371259e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4439659404853478e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 297, - "real_time": 2.3745762635812615e+06, - "cpu_time": 2.7401798888891479e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5198058706407398e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 297, - "real_time": 2.3600910931374086e+06, - "cpu_time": 2.7273697979796790e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5536839396210864e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 297, - "real_time": 2.3727903859094037e+06, - "cpu_time": 2.7391766801346503e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5239603455222577e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 297, - "real_time": 2.3611943631022167e+06, - "cpu_time": 2.7293242356903409e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5510889763345532e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 297, - "real_time": 2.3730947684672242e+06, - "cpu_time": 2.7389981212121500e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5232518204344220e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3683493748395029e+06, - "cpu_time": 2.7350097447811938e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5343581905106120e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time_median", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3727903859094037e+06, - "cpu_time": 2.7389981212121500e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5239603455222577e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0782923971076616e+03, - "cpu_time": 6.1378882289557232e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6557780823716987e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9887027954173099e-03, - "cpu_time": 2.2441924533057804e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9918158987445897e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 281, - "real_time": 2.4901176463096696e+06, - "cpu_time": 2.8946695338078449e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0527374093689704e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 281, - "real_time": 2.4891598862711857e+06, - "cpu_time": 2.8889975017792168e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0531424736749123e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 281, - "real_time": 2.4942480196705703e+06, - "cpu_time": 2.8899019074733783e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0509941189995326e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 281, - "real_time": 2.4990981728090406e+06, - "cpu_time": 2.8958754661921230e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0489543902364767e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 281, - "real_time": 2.4960962964347778e+06, - "cpu_time": 2.8973040106760813e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0502158926096934e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4937440042990493e+06, - "cpu_time": 2.8933496839857292e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0512088569779171e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time_median", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4942480196705707e+06, - "cpu_time": 2.8946695338078449e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0509941189995326e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1418305307713581e+03, - "cpu_time": 3.6941484715032793e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7457130969893077e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6608884166262124e-03, - "cpu_time": 1.2767722104071468e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6606719829282985e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 272, - "real_time": 2.5805253261590707e+06, - "cpu_time": 3.0489445036766604e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0317103447318831e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 272, - "real_time": 2.5826170903575770e+06, - "cpu_time": 3.0559452830884228e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0300647817962420e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 272, - "real_time": 2.5766729377210140e+06, - "cpu_time": 3.0488476323531484e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0347479585970125e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 272, - "real_time": 2.5805359071134315e+06, - "cpu_time": 3.0486031617647479e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0317020141233557e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 272, - "real_time": 2.5761211890152055e+06, - "cpu_time": 3.0463662132354877e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0351837570204678e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5792944900732599e+06, - "cpu_time": 3.0497413588236938e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0326817712537920e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time_median", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5805253261590707e+06, - "cpu_time": 3.0488476323531484e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0317103447318831e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7855934165239232e+03, - "cpu_time": 3.6266203858531130e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1955233011744602e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0799826957505747e-03, - "cpu_time": 1.1891567051613601e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0801116693343615e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 256, - "real_time": 2.7409931944930577e+06, - "cpu_time": 3.3464274531249669e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8255330298035723e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 256, - "real_time": 2.7444050720077939e+06, - "cpu_time": 3.3496051445314200e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8207770809608173e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 256, - "real_time": 2.7394650423957501e+06, - "cpu_time": 3.3429534414062267e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8276670217444593e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 256, - "real_time": 2.7465463708722382e+06, - "cpu_time": 3.3509486445315597e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8177982761201191e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 256, - "real_time": 2.7354581916370080e+06, - "cpu_time": 3.3371812031250945e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8332737206723309e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7413735742811696e+06, - "cpu_time": 3.3454231773438537e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8250098258602595e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time_median", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7409931944930577e+06, - "cpu_time": 3.3464274531249674e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8255330298035723e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3222314147100360e+03, - "cpu_time": 5.5465742055662431e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0321838675557624e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5766663307985639e-03, - "cpu_time": 1.6579589222461310e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5770374828250541e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 228, - "real_time": 3.0779122658841833e+06, - "cpu_time": 4.0012951447370900e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8135535351185739e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 228, - "real_time": 3.0732112303539589e+06, - "cpu_time": 3.9921912719298811e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8239761044946444e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 228, - "real_time": 3.0809031572732092e+06, - "cpu_time": 4.0088172368420898e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8069390465882409e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 228, - "real_time": 3.0850596284787906e+06, - "cpu_time": 4.0074188245613952e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7977681229911363e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 228, - "real_time": 3.0869846242447300e+06, - "cpu_time": 4.0095636271928470e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7935291401494908e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0808141812469745e+06, - "cpu_time": 4.0038572210526606e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8071531898684180e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time_median", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0809031572732092e+06, - "cpu_time": 4.0074188245613948e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8069390465882409e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5301916959498139e+03, - "cpu_time": 7.2888348040043757e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2224104713229514e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7950422747377262e-03, - "cpu_time": 1.8204532283716290e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7957734125072342e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 194, - "real_time": 3.5934116626542406e+06, - "cpu_time": 5.0674140103094084e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1672205674598150e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 194, - "real_time": 3.5920220525628054e+06, - "cpu_time": 5.0656359845360965e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1676721185515785e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 194, - "real_time": 3.5893894004702722e+06, - "cpu_time": 5.0618927061852030e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1685285523633835e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 194, - "real_time": 3.5956610467035286e+06, - "cpu_time": 5.0709543247426292e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1664903742373888e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 194, - "real_time": 3.5967802648077304e+06, - "cpu_time": 5.0700995721653849e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1661273948366179e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5934528854397153e+06, - "cpu_time": 5.0671993195877448e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1672078014897568e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time_median", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5934116626542406e+06, - "cpu_time": 5.0674140103094084e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1672205674598150e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9371892074703019e+03, - "cpu_time": 3.6456063663824266e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5421650742376072e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.1737239950229401e-04, - "cpu_time": 7.1945193714602568e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1752067301628188e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 143, - "real_time": 4.9604994205797054e+06, - "cpu_time": 7.7209309230768867e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6910813385438662e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 143, - "real_time": 4.9408484133077664e+06, - "cpu_time": 7.7042753146851426e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6978071979310229e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 143, - "real_time": 4.9527477687941147e+06, - "cpu_time": 7.7142267972023319e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6937280862260511e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 143, - "real_time": 4.9385513452539491e+06, - "cpu_time": 7.7029802167827431e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6985968988783779e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 143, - "real_time": 4.9418475530989524e+06, - "cpu_time": 7.6992068461534027e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6974639362842426e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9468989002068983e+06, - "cpu_time": 7.7083240195801016e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6957354915727122e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time_median", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9418475530989524e+06, - "cpu_time": 7.7042753146851435e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.6974639362842426e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3673581010224916e+03, - "cpu_time": 8.9700597873566694e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2077233657284100e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8935818762398221e-03, - "cpu_time": 1.1636848379195789e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8916413448145752e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 87, - "real_time": 7.8320522396557629e+06, - "cpu_time": 1.3373907885058291e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1421225863449295e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 87, - "real_time": 7.9068590715613170e+06, - "cpu_time": 1.3498262333334016e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1218559541983981e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 87, - "real_time": 7.8452385630158857e+06, - "cpu_time": 1.3402879344828332e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1385220940369291e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 87, - "real_time": 7.8592228478398817e+06, - "cpu_time": 1.3400996965516638e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1347169211026051e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 87, - "real_time": 7.8446261113745039e+06, - "cpu_time": 1.3407933425287671e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1386890543672276e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8575997666894700e+06, - "cpu_time": 1.3416795990804991e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1351813220100179e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time_median", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8452385630158857e+06, - "cpu_time": 1.3402879344828334e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1385220940369291e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9167210763729363e+04, - "cpu_time": 4.7428846397385074e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8966320369939990e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.7119746016305391e-03, - "cpu_time": 3.5350352222609446e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6983425976957612e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.3673750428008098e+07, - "cpu_time": 2.5017834568627987e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4539304104359016e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.3719416442601120e+07, - "cpu_time": 2.5088139823528938e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4457623354742541e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3571591463451292e+07, - "cpu_time": 2.4753433529411390e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4724021563987617e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.3710851744547779e+07, - "cpu_time": 2.5048037725491218e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4472901191819224e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.3665900930908380e+07, - "cpu_time": 2.5012202666666068e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4553399127978029e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3668302201903334e+07, - "cpu_time": 2.4983929662745126e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4549449868577285e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time_median", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3673750428008098e+07, - "cpu_time": 2.5017834568627991e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4539304104359016e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.8761265693269423e+04, - "cpu_time": 1.3233194455156181e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0593113161023062e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2990903204559536e-03, - "cpu_time": 5.2966825610660066e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3150104046046243e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 28, - "real_time": 2.5388796946832113e+07, - "cpu_time": 4.8322486035711363e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6432471038519812e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 28, - "real_time": 2.5318739736186605e+07, - "cpu_time": 4.8245592821428671e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6505609955018888e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 28, - "real_time": 2.5423180444964342e+07, - "cpu_time": 4.8343840785715230e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6396722528590040e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 28, - "real_time": 2.5372728572360106e+07, - "cpu_time": 4.8317072321428411e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6449210540605922e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 28, - "real_time": 2.5365237013569899e+07, - "cpu_time": 4.8310743678570136e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6457022248243961e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5373736542782616e+07, - "cpu_time": 4.8307947128570765e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6448207262195725e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time_median", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5372728572360110e+07, - "cpu_time": 4.8317072321428411e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6449210540605922e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7978355578041774e+04, - "cpu_time": 3.7009741617712985e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9598251919396645e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4967584893934138e-03, - "cpu_time": 7.6612118331611558e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4971998490044048e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 4.6163347611824669e+07, - "cpu_time": 8.8437132866662681e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9074522309040761e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 4.6018034716447197e+07, - "cpu_time": 8.8283907933335587e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9166332031999960e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 4.6098014215628304e+07, - "cpu_time": 8.8362695866665795e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9115728797379966e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.6501524001359940e+07, - "cpu_time": 8.8513707866665453e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.8863081561816082e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 4.6235444148381554e+07, - "cpu_time": 8.8499153266661778e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9029185394923525e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6203272938728333e+07, - "cpu_time": 8.8419319559998259e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9049770019032059e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time_median", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6163347611824669e+07, - "cpu_time": 8.8437132866662666e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9074522309040761e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8505087989508553e+05, - "cpu_time": 9.6361867879594138e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1600242020813186e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.0051465648437406e-03, - "cpu_time": 1.0898281999807333e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9932302435486565e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.7834523990750313e+07, - "cpu_time": 1.6739108562499893e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0561497211309352e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.7579902261495590e+07, - "cpu_time": 1.6726854674999458e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0650348889235673e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.7602465413510799e+07, - "cpu_time": 1.6582776075000539e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0642454494048929e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.7787705473601818e+07, - "cpu_time": 1.6745306925000137e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0577796122114139e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.7882065214216709e+07, - "cpu_time": 1.6736816487500051e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0544964475479250e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7737332470715046e+07, - "cpu_time": 1.6706172545000017e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0595412238437471e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time_median", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7787705473601818e+07, - "cpu_time": 1.6736816487500051e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0577796122114139e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3775393997760961e+05, - "cpu_time": 6.9299659934480512e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8053467149499217e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5700721243558334e-03, - "cpu_time": 4.1481470245691423e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5706102200881260e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.7017837986350060e+08, - "cpu_time": 3.1684936249999398e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1547539260311565e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6972714290022850e+08, - "cpu_time": 3.1322809249999750e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1631411619035578e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.7027433961629868e+08, - "cpu_time": 3.1675417675000972e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1529760339097548e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.6973597928881645e+08, - "cpu_time": 3.1395536700000548e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1629764900138254e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.7047281935811043e+08, - "cpu_time": 3.1726963400001293e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1493050564981918e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7007773220539093e+08, - "cpu_time": 3.1561132655000395e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1566305336712976e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time_median", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7017837986350060e+08, - "cpu_time": 3.1675417675000972e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1547539260311565e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3338648751596780e+05, - "cpu_time": 1.8715521472918182e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1886808458022783e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9602006870209224e-03, - "cpu_time": 5.9299270648808557e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9605337969675453e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.2444499433040619e+08, - "cpu_time": 5.6518055100002587e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3094726155846615e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.2668259739875793e+08, - "cpu_time": 5.6707933399997044e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2868044779543633e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.2603237032890320e+08, - "cpu_time": 5.6564865950002742e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2933595609442201e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.2599011063575745e+08, - "cpu_time": 5.6696952800001550e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2937864952588615e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.2592433691024780e+08, - "cpu_time": 5.6681365550002742e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2944512035493817e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2581488192081451e+08, - "cpu_time": 5.6633834560001349e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2955748706582975e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time_median", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2599011063575745e+08, - "cpu_time": 5.6681365550002742e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.2937864952588615e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2454667331180233e+05, - "cpu_time": 8.6451283738346561e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.3581638787475331e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5307213361487847e-03, - "cpu_time": 1.5264953258066042e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5361778162478745e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 311, - "real_time": 2.2522889315734627e+06, - "cpu_time": 2.5875881479097246e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8185943830654577e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 311, - "real_time": 2.2476633196139643e+06, - "cpu_time": 2.5764016848873375e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8223369862633552e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 311, - "real_time": 2.2496990941860187e+06, - "cpu_time": 2.5902749292604499e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8206879358157031e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 311, - "real_time": 2.2485518050934053e+06, - "cpu_time": 2.5772533794213030e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8216169139273406e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 311, - "real_time": 2.2484314106883919e+06, - "cpu_time": 2.5768717395498496e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8217144541429202e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2493269122310490e+06, - "cpu_time": 2.5816779762057327e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8209901346429554e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time_median", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2485518050934048e+06, - "cpu_time": 2.5772533794213030e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8216169139273406e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8084753575546874e+03, - "cpu_time": 6.6961546608113003e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4630832212171088e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.0400734447306642e-04, - "cpu_time": 2.5937218826387379e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0345477626872367e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 308, - "real_time": 2.2474360597839989e+06, - "cpu_time": 2.5786197142857071e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6450425204921439e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 308, - "real_time": 2.2594324576172540e+06, - "cpu_time": 2.5926419090906577e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6256892620897796e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 308, - "real_time": 2.2471451749359923e+06, - "cpu_time": 2.5786728766233153e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6455143581158887e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 308, - "real_time": 2.2473586284761112e+06, - "cpu_time": 2.5790231396102072e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6451681081069075e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 308, - "real_time": 2.2542459630201776e+06, - "cpu_time": 2.5979222077923282e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6340311280959691e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2511236567667066e+06, - "cpu_time": 2.5853759694804433e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6390890753801377e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time_median", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2474360597839989e+06, - "cpu_time": 2.5790231396102067e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6450425204921439e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5314350563186563e+03, - "cpu_time": 9.2349723829490722e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9277689371869819e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4571884532826895e-03, - "cpu_time": 3.5720036435570850e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4532977215608251e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 310, - "real_time": 2.2546913947970155e+06, - "cpu_time": 2.5882727032258264e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2666263941079229e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 310, - "real_time": 2.2600152785138739e+06, - "cpu_time": 2.6009969258064949e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2495085125148734e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 310, - "real_time": 2.2540906346553275e+06, - "cpu_time": 2.5881876677420135e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2685630950706089e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 310, - "real_time": 2.2699910861950726e+06, - "cpu_time": 2.6036862677418897e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2176494875416588e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 310, - "real_time": 2.2538222334978562e+06, - "cpu_time": 2.5877414677420203e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2694286871829210e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2585221255318294e+06, - "cpu_time": 2.5937770064516487e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2543552352835974e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time_median", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2546913947970155e+06, - "cpu_time": 2.5882727032258264e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2666263941079229e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8950735855507401e+03, - "cpu_time": 7.8785544920033572e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2081984793313062e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0529138978114333e-03, - "cpu_time": 3.0374833582095073e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0439624304460745e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 308, - "real_time": 2.2715665490741464e+06, - "cpu_time": 2.6222690974024073e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4425287259735225e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 308, - "real_time": 2.2714351358303390e+06, - "cpu_time": 2.6107050162334433e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4426121830690723e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 308, - "real_time": 2.2830772478218107e+06, - "cpu_time": 2.6215686850652625e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4352558605392171e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 308, - "real_time": 2.2712096786610298e+06, - "cpu_time": 2.6102533376623732e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4427553874866394e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 308, - "real_time": 2.2771514962765980e+06, - "cpu_time": 2.6220150811689286e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4389907765723716e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2748880215327847e+06, - "cpu_time": 2.6173622435064828e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4404285867281646e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time_median", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2715665490741464e+06, - "cpu_time": 2.6215686850652625e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4425287259735225e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2122823785688761e+03, - "cpu_time": 6.2903791881973220e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2945816832457087e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2912259105645648e-03, - "cpu_time": 2.4033277028441026e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2872232012064735e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 303, - "real_time": 2.3176034423753177e+06, - "cpu_time": 2.6638909339933940e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8277486476647612e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 303, - "real_time": 2.3172448947103601e+06, - "cpu_time": 2.6712845841586278e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8281861856552523e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 303, - "real_time": 2.3083281618767348e+06, - "cpu_time": 2.6555796930694454e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8391110537211232e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 303, - "real_time": 2.3163445555165461e+06, - "cpu_time": 2.6701155940595572e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8292854724018138e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 303, - "real_time": 2.3079627530077603e+06, - "cpu_time": 2.6554228943893844e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8395605567981038e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3134967614973439e+06, - "cpu_time": 2.6632587399340817e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8327783832482114e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time_median", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3163445555165457e+06, - "cpu_time": 2.6638909339933936e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8292854724018138e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9082311780974505e+03, - "cpu_time": 7.6190309339572977e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0143066582680585e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1215638853631855e-03, - "cpu_time": 2.8607926145943585e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1231123104560479e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 295, - "real_time": 2.3887250169922234e+06, - "cpu_time": 2.7552692033896935e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4871112860466480e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 295, - "real_time": 2.3735488378206049e+06, - "cpu_time": 2.7401872169494415e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5221952003460974e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 295, - "real_time": 2.3858769986210233e+06, - "cpu_time": 2.7520504915254591e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.4936612438845888e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 295, - "real_time": 2.3801571113388920e+06, - "cpu_time": 2.7512276237287596e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5068633652620114e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 295, - "real_time": 2.3726094308924875e+06, - "cpu_time": 2.7389218237288534e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5243816488875531e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3801834791330462e+06, - "cpu_time": 2.7475312718644417e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5068425488853805e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time_median", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3801571113388920e+06, - "cpu_time": 2.7512276237287601e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5068633652620114e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1895653644080912e+03, - "cpu_time": 7.4501625407375222e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6631249981397970e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0205929195957640e-03, - "cpu_time": 2.7115842563938974e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0201063193216302e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 281, - "real_time": 2.4990964609652334e+06, - "cpu_time": 2.9011274555159616e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0489551087545910e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 281, - "real_time": 2.5028164069304154e+06, - "cpu_time": 2.9000137615658301e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0473960426106806e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 281, - "real_time": 2.4975249154354013e+06, - "cpu_time": 2.8981758291815515e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0496151545070758e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 281, - "real_time": 2.4965984475039928e+06, - "cpu_time": 2.8949153665481065e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0500046583866218e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 281, - "real_time": 2.4971008396896389e+06, - "cpu_time": 2.8982136156581328e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0497934077527341e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4986274141049366e+06, - "cpu_time": 2.8984892056939164e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0491528744023407e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time_median", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4975249154354013e+06, - "cpu_time": 2.8982136156581333e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0496151545070758e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5214234115718641e+03, - "cpu_time": 2.3574940973804892e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0577205467419076e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0091234080512534e-03, - "cpu_time": 8.1335272622348449e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0081662763822170e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 271, - "real_time": 2.5881987539329650e+06, - "cpu_time": 3.0502610184501675e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0256867800562242e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 271, - "real_time": 2.5907073993015885e+06, - "cpu_time": 3.0581838044277513e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0237252579791117e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 271, - "real_time": 2.5848977944755247e+06, - "cpu_time": 3.0521341217711600e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0282736173186994e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 271, - "real_time": 2.5869423722868916e+06, - "cpu_time": 3.0496167822880410e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0266705807463443e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 271, - "real_time": 2.5830539218339091e+06, - "cpu_time": 3.0482541328415694e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0297214687170273e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5867600483661760e+06, - "cpu_time": 3.0516899719557380e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0268155409634817e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time_median", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5869423722868916e+06, - "cpu_time": 3.0502610184501670e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0266705807463443e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9533057133673674e+03, - "cpu_time": 3.8894775733283814e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3138369828058328e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1417006827644121e-03, - "cpu_time": 1.2745323440689258e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1416120194667101e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 254, - "real_time": 2.7463891933943462e+06, - "cpu_time": 3.3477639645666853e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8180167709735012e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 254, - "real_time": 2.7427701765348711e+06, - "cpu_time": 3.3500611062993985e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8230545489040488e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 254, - "real_time": 2.7467803424590919e+06, - "cpu_time": 3.3491023464569831e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8174730748992044e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 254, - "real_time": 2.7447185134441834e+06, - "cpu_time": 3.3511427125982507e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8203407557600671e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 254, - "real_time": 2.7438909609208074e+06, - "cpu_time": 3.3434887283465462e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8214929635837793e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7449098373506600e+06, - "cpu_time": 3.3483117716535726e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8200756228241205e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time_median", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7447185134441834e+06, - "cpu_time": 3.3491023464569831e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8203407557600671e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6837566694615452e+03, - "cpu_time": 2.9690590345878450e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3433564355428304e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.1341055598630463e-04, - "cpu_time": 8.8673314705146682e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1343194923728361e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 228, - "real_time": 3.0811807526716669e+06, - "cpu_time": 4.0093141842106162e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8063257833269811e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 228, - "real_time": 3.0810264421202112e+06, - "cpu_time": 4.0125437587718945e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8066666722822511e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 228, - "real_time": 3.0812895509594101e+06, - "cpu_time": 4.0101601491228351e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8060854564836895e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 228, - "real_time": 3.0940888508778522e+06, - "cpu_time": 4.0107215131579204e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7779307611188924e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 228, - "real_time": 3.0952805812519630e+06, - "cpu_time": 4.0278122982458668e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7753211540898657e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0865732355762208e+06, - "cpu_time": 4.0141103807018274e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.7944659654603362e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time_median", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0812895509594101e+06, - "cpu_time": 4.0107215131579200e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8060854564836895e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4173016441286672e+03, - "cpu_time": 7.7506306547005370e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6313046032424478e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4030862312405033e-03, - "cpu_time": 1.9308464191623493e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4009313042926165e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 194, - "real_time": 3.6026124468015642e+06, - "cpu_time": 5.0735836597937122e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1642395794540002e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 194, - "real_time": 3.5970190782388002e+06, - "cpu_time": 5.0683627835047850e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1660499732610946e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 194, - "real_time": 3.5964309792370372e+06, - "cpu_time": 5.0685040463918084e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1662406491921051e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 194, - "real_time": 3.5940235895920815e+06, - "cpu_time": 5.0628527628865391e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1670218337314947e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 194, - "real_time": 3.5976772100578262e+06, - "cpu_time": 5.0685517577320067e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1658366649109645e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5975526607854618e+06, - "cpu_time": 5.0683710020617703e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1658777401099319e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time_median", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5970190782388002e+06, - "cpu_time": 5.0685040463918084e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1660499732610946e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1469894485355617e+03, - "cpu_time": 3.7971438340766390e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0192613722495325e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7475841086047433e-04, - "cpu_time": 7.4918427094859338e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7424378833532337e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 144, - "real_time": 4.8442672381901909e+06, - "cpu_time": 7.5475284097221456e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7316567372393701e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 144, - "real_time": 4.8791874529949082e+06, - "cpu_time": 7.5897738125002934e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7192633160365596e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 144, - "real_time": 4.8782897194743985e+06, - "cpu_time": 7.5937097847224139e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7195797056727114e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 144, - "real_time": 4.8689474028328229e+06, - "cpu_time": 7.5866650624997569e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7228791576428590e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 144, - "real_time": 4.9301943702933686e+06, - "cpu_time": 7.6671767777780378e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7014761224314246e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8801772367571387e+06, - "cpu_time": 7.5969707694445299e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7189710078045850e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time_median", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8782897194743985e+06, - "cpu_time": 7.5897738125002934e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7195797056727114e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1312510309761699e+04, - "cpu_time": 4.3422541229249036e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0985539789494189e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.4162649819187213e-03, - "cpu_time": 5.7157704757660882e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3907650214092733e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 94, - "real_time": 7.7399991036571087e+06, - "cpu_time": 1.3211916095744595e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1675992174305105e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 94, - "real_time": 7.7185811019165721e+06, - "cpu_time": 1.3180511202126533e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1736140073509254e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 94, - "real_time": 7.7103018820127277e+06, - "cpu_time": 1.3160238893616913e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1759480052446933e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 94, - "real_time": 7.7503634111440564e+06, - "cpu_time": 1.3227530500000257e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1647005578959632e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 94, - "real_time": 7.7480791146530118e+06, - "cpu_time": 1.3228182372340646e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1653387570954542e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7334649226766955e+06, - "cpu_time": 1.3201675812765788e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1694401090035095e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time_median", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7399991036571087e+06, - "cpu_time": 1.3211916095744593e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1675992174305105e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8026949366195702e+04, - "cpu_time": 3.0169873052337225e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0608165065807318e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3310313742208378e-03, - "cpu_time": 2.2853063111247956e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3327753947101678e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.3690888352107769e+07, - "cpu_time": 2.4924777431373980e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4508586394858856e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.3777480022433925e+07, - "cpu_time": 2.4962129294116423e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4354549558673415e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3766923188871028e+07, - "cpu_time": 2.4977280450981177e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4373225258585663e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.3771114523942564e+07, - "cpu_time": 2.5017988784312885e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4365807096921611e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.3747983502552791e+07, - "cpu_time": 2.4978628647059564e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4406802636742659e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3750877917981615e+07, - "cpu_time": 2.4972160921568803e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4401794189156442e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time_median", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3766923188871026e+07, - "cpu_time": 2.4977280450981177e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4373225258585663e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5290822299966429e+04, - "cpu_time": 3.3593387557687114e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2795241572590517e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5664413945394472e-03, - "cpu_time": 1.3452335047493642e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5733862471676440e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 28, - "real_time": 2.5406183076224156e+07, - "cpu_time": 4.8230400071430169e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6414382592874575e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 28, - "real_time": 2.5257250826273646e+07, - "cpu_time": 4.8117533214285195e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6570138001793356e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 28, - "real_time": 2.5353331717529468e+07, - "cpu_time": 4.8213626785716154e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6469445809996037e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 28, - "real_time": 2.5161444608654294e+07, - "cpu_time": 4.8029329178571545e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6671308044418826e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 28, - "real_time": 2.5344080225165401e+07, - "cpu_time": 4.8156991214288577e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6479108100898552e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5304458090769395e+07, - "cpu_time": 4.8149576092858337e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6520876509996271e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time_median", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5344080225165401e+07, - "cpu_time": 4.8156991214288577e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6479108100898552e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6161192121333836e+04, - "cpu_time": 8.0895082134647426e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0097897356293537e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8001680089885699e-03, - "cpu_time": 1.6800788023271088e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8075277611912370e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 4.4647005945444107e+07, - "cpu_time": 8.5390817733332366e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.0061977316912537e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 4.5632461706797279e+07, - "cpu_time": 8.7460906333330959e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9412773928873382e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 4.5618819197018944e+07, - "cpu_time": 8.7439859466667250e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9421569949090385e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.5584910611311592e+07, - "cpu_time": 8.7485630799998626e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9443455345220037e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 4.5802521457274757e+07, - "cpu_time": 8.7765852599992901e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9303567517609310e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5457143783569336e+07, - "cpu_time": 8.7108613386664420e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9528668811541133e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time_median", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5618819197018936e+07, - "cpu_time": 8.7460906333330959e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9421569949090385e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6065408118338475e+05, - "cpu_time": 9.6937630797854648e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0300646834653545e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0133810504607418e-02, - "cpu_time": 1.1128363433769793e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0261433398179700e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.7775896303355694e+07, - "cpu_time": 1.6786967612500802e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0581909989535208e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.6567091755568981e+07, - "cpu_time": 1.6536688587500235e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1008949308122182e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.6434991098940372e+07, - "cpu_time": 1.6535480574999896e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1056341024288116e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.6436070501804352e+07, - "cpu_time": 1.6540262425000662e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1055953196576238e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.7697220034897327e+07, - "cpu_time": 1.6755809900000429e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0609346099361138e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6982253938913345e+07, - "cpu_time": 1.6631041820000404e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0862499923576579e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time_median", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6567091755568981e+07, - "cpu_time": 1.6540262425000662e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1008949308122182e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9123391889346915e+05, - "cpu_time": 1.2860337198093049e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4457285887450390e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.9468384364805595e-03, - "cpu_time": 7.7327309601418204e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.9245964999636667e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.6890264302492142e+08, - "cpu_time": 3.1231735574999672e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1785820658874192e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6815992072224617e+08, - "cpu_time": 3.1316890625001293e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1926211055175433e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.6843475401401520e+08, - "cpu_time": 3.1274268149999785e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1874117378134909e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.6813463345170021e+08, - "cpu_time": 3.1364125774999249e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1931012723456893e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.6891196742653847e+08, - "cpu_time": 3.1299162125000632e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1784065994820089e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6850878372788429e+08, - "cpu_time": 3.1297236450000131e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1860245562092304e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time_median", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6843475401401520e+08, - "cpu_time": 3.1299162125000632e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1874117378134909e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8237954480229574e+05, - "cpu_time": 4.9198790758488711e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2274230148456097e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2691965151192340e-03, - "cpu_time": 1.5719851443461391e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2684768705753112e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.1852456927299500e+08, - "cpu_time": 5.6202723349997544e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3709858754403896e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.2178907096385956e+08, - "cpu_time": 5.6449743949997354e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3367877311177950e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.2179450988769531e+08, - "cpu_time": 5.6493086199998283e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3367313332186136e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.2008592784404755e+08, - "cpu_time": 5.6290241149997652e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3545424231306701e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.2134233415126801e+08, - "cpu_time": 5.6502436350001514e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3414266029901590e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2070728242397314e+08, - "cpu_time": 5.6387646199998474e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3480947931795259e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time_median", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2134233415126801e+08, - "cpu_time": 5.6449743949997354e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3414266029901590e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4058750755873274e+06, - "cpu_time": 1.3400998741498562e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4722569529556992e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.3836705701268391e-03, - "cpu_time": 2.3765841712858949e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3972976988431289e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 313, - "real_time": 2.2324283009234327e+06, - "cpu_time": 2.5812123961661644e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8347733713578663e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 313, - "real_time": 2.2323332896557287e+06, - "cpu_time": 2.5740498913735198e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8348514619121621e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 313, - "real_time": 2.2401686559934109e+06, - "cpu_time": 2.5877909392969590e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8284337605748768e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 313, - "real_time": 2.2318731582821747e+06, - "cpu_time": 2.5732157635785099e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8352297417979629e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 313, - "real_time": 2.2398092800352615e+06, - "cpu_time": 2.5874094025556738e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8287271315955599e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2353225369780017e+06, - "cpu_time": 2.5807356785941655e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8324030934476857e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time_median", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2324283009234322e+06, - "cpu_time": 2.5812123961661644e+06, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.8347733713578663e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2669118825931819e+03, - "cpu_time": 6.9962744970135082e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4953885835622991e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9088573626433998e-03, - "cpu_time": 2.7109612793917242e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9075434854160221e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 313, - "real_time": 2.2332967845157692e+06, - "cpu_time": 2.5764134536740705e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6681197307935120e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 313, - "real_time": 2.2381080378489657e+06, - "cpu_time": 2.5875397667734069e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6602343861261001e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 313, - "real_time": 2.2324645719208275e+06, - "cpu_time": 2.5757751693291152e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6694871233506510e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 313, - "real_time": 2.2447810466654194e+06, - "cpu_time": 2.5886802747602728e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6493536918306863e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 313, - "real_time": 2.2324860325089088e+06, - "cpu_time": 2.5757952012779065e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6694518490642831e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2362272946919780e+06, - "cpu_time": 2.5808407731629545e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6633293562330473e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time_median", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2332967845157692e+06, - "cpu_time": 2.5764134536740701e+06, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.6681197307935120e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3255723381542603e+03, - "cpu_time": 6.6530744094418988e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7070192690025233e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3814986744841666e-03, - "cpu_time": 2.5778709320715704e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3768049286062107e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 312, - "real_time": 2.2470296617263020e+06, - "cpu_time": 2.5974814775640182e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2914035266507501e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 312, - "real_time": 2.2415916699593742e+06, - "cpu_time": 2.5863581378203915e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.3090921150224190e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 312, - "real_time": 2.2418732174302046e+06, - "cpu_time": 2.5981542532054372e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.3081741967462879e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 312, - "real_time": 2.2418619482778013e+06, - "cpu_time": 2.5867965705128447e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.3082109326964542e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 312, - "real_time": 2.2509142835564814e+06, - "cpu_time": 2.6016785096152406e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2788200420111110e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2446541561900331e+06, - "cpu_time": 2.5940937897435864e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.2991401626254059e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time_median", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2418732174302042e+06, - "cpu_time": 2.5974814775640178e+06, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 7.3081741967462879e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1755565054425297e+03, - "cpu_time": 7.0459471861386210e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3561865990365228e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8602226511944796e-03, - "cpu_time": 2.7161497452391956e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8580087089993900e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 311, - "real_time": 2.2531404710970698e+06, - "cpu_time": 2.6012761800642502e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4543256588012477e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 311, - "real_time": 2.2526733432013025e+06, - "cpu_time": 2.6134362218649397e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4546272365185881e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 311, - "real_time": 2.2530468634458506e+06, - "cpu_time": 2.6019232765274774e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4543860818715520e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 311, - "real_time": 2.2590538386519030e+06, - "cpu_time": 2.6138499967843820e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4505187720339769e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 311, - "real_time": 2.2529583735768818e+06, - "cpu_time": 2.6018617491959147e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4544432060667098e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2541745779946013e+06, - "cpu_time": 2.6064694848873927e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4536601910584150e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time_median", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2530468634458506e+06, - "cpu_time": 2.6019232765274774e+06, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.4543860818715520e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7331831637405398e+03, - "cpu_time": 6.5550940803797275e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7597277986639368e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2124984419672065e-03, - "cpu_time": 2.5149322170801959e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2105496246565526e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 306, - "real_time": 2.3002298137940029e+06, - "cpu_time": 2.6653100816994156e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8491066243465826e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 306, - "real_time": 2.2892530397298969e+06, - "cpu_time": 2.6482166960787713e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8627678488408785e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 306, - "real_time": 2.2972905833359347e+06, - "cpu_time": 2.6626812222219002e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8527518667157058e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 306, - "real_time": 2.2892551161835785e+06, - "cpu_time": 2.6484315751635567e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8627652521862738e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 306, - "real_time": 2.2896608951032842e+06, - "cpu_time": 2.6486089705881984e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8622579064068671e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2931378896293393e+06, - "cpu_time": 2.6546497091503688e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8579298996992618e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time_median", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2896608951032842e+06, - "cpu_time": 2.6486089705881989e+06, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.8622579064068671e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2392206644280550e+03, - "cpu_time": 8.5832411555367944e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5226574561772752e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2847386056121192e-03, - "cpu_time": 3.2332857800225156e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2823014157427901e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 296, - "real_time": 2.3660522923376914e+06, - "cpu_time": 2.7444166317565078e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5396915961861141e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 296, - "real_time": 2.3768231637675213e+06, - "cpu_time": 2.7601136114863744e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5145877908828825e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 296, - "real_time": 2.3659539119516676e+06, - "cpu_time": 2.7443493986484902e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5399219459807292e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 296, - "real_time": 2.3716042106153090e+06, - "cpu_time": 2.7547469256757190e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5267231949294597e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 296, - "real_time": 2.3651766296589393e+06, - "cpu_time": 2.7531854932434312e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5417425640173309e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3691220416662260e+06, - "cpu_time": 2.7513624121621051e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5325334183993034e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time_median", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3660522923376919e+06, - "cpu_time": 2.7531854932434317e+06, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 5.5396915961861141e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0123628921051804e+03, - "cpu_time": 6.8700121896886430e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1688054326961352e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1157048070769447e-03, - "cpu_time": 2.4969492057173148e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1126043790519011e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 282, - "real_time": 2.4803442911885628e+06, - "cpu_time": 2.8931453333332180e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0568855337191215e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 282, - "real_time": 2.4768010612431886e+06, - "cpu_time": 2.8864208758863024e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0583974793212549e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 282, - "real_time": 2.4805485480630123e+06, - "cpu_time": 2.8937656347516938e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0567985061397028e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 282, - "real_time": 2.4860192342918920e+06, - "cpu_time": 2.8956457375884317e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0544729356233966e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 282, - "real_time": 2.4756004543420165e+06, - "cpu_time": 2.8851865000003711e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0589107767378989e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4798627178257350e+06, - "cpu_time": 2.8908328163120039e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0570930463082750e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time_median", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4803442911885628e+06, - "cpu_time": 2.8931453333332185e+06, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.0568855337191215e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0664973270655782e+03, - "cpu_time": 4.7026449045999198e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7320857936314816e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6398074368531796e-03, - "cpu_time": 1.6267439881215079e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6385367396753849e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 271, - "real_time": 2.5776647902489039e+06, - "cpu_time": 3.0537243394838292e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0339650135399252e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 271, - "real_time": 2.5725506462596660e+06, - "cpu_time": 3.0518481180814891e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0380084674417713e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 271, - "real_time": 2.5716839182943217e+06, - "cpu_time": 3.0501633726935224e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0386953321531671e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 271, - "real_time": 2.5735301604817496e+06, - "cpu_time": 3.0530910738011748e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0372327787363347e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 271, - "real_time": 2.5681633247935465e+06, - "cpu_time": 3.0499665498160115e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0414900989295426e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5727185680156378e+06, - "cpu_time": 3.0517586907752054e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0378783381601483e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time_median", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5725506462596660e+06, - "cpu_time": 3.0518481180814891e+06, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0380084674417713e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4268329138294066e+03, - "cpu_time": 1.6884775391976189e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7138572746185458e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3319890315373886e-03, - "cpu_time": 5.5328016081399706e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3317072093070529e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 256, - "real_time": 2.7306286146995262e+06, - "cpu_time": 3.3438218359380658e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8400535113244742e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 256, - "real_time": 2.7362186674508848e+06, - "cpu_time": 3.3499578242190965e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8322083409250110e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 256, - "real_time": 2.7446712310847943e+06, - "cpu_time": 3.3595292734371894e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8204065686423379e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 256, - "real_time": 2.7349611391400686e+06, - "cpu_time": 3.3473907539063320e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8339703807626867e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 256, - "real_time": 2.7330592747603077e+06, - "cpu_time": 3.3449752460938953e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8366383403519899e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7359077854271168e+06, - "cpu_time": 3.3491349867189159e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8326554284013003e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time_median", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7349611391400686e+06, - "cpu_time": 3.3473907539063320e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.8339703807626867e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3332547098991436e+03, - "cpu_time": 6.2708376499315145e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4592018817028939e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9493547035126192e-03, - "cpu_time": 1.8723753072953729e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9462229310852294e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 229, - "real_time": 3.0630223644189700e+06, - "cpu_time": 3.9972968689955338e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8466754417505288e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 229, - "real_time": 3.0664033358143927e+06, - "cpu_time": 4.0031437248906191e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8391263977118862e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 229, - "real_time": 3.0631174081245102e+06, - "cpu_time": 3.9957984716161126e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8464630002022910e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 229, - "real_time": 3.0646824804602363e+06, - "cpu_time": 4.0056186288204445e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8429666478370774e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 229, - "real_time": 3.0758971374839805e+06, - "cpu_time": 4.0085722096067532e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8180173336856985e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0666245452604177e+06, - "cpu_time": 4.0020859807858923e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8386497642374969e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time_median", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0646824804602358e+06, - "cpu_time": 4.0031437248906181e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 6.8429666478370774e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3637028618004133e+03, - "cpu_time": 5.4345642039323957e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1937524970612626e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7490575656189198e-03, - "cpu_time": 1.3579328955009621e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7455967745328232e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 195, - "real_time": 3.5827156502562454e+06, - "cpu_time": 5.0722837435900243e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1707052441351330e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 195, - "real_time": 3.5791595681355549e+06, - "cpu_time": 5.0674617948714467e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1718684009902594e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 195, - "real_time": 3.5798438287411747e+06, - "cpu_time": 5.0671404205133561e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1716444070340621e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 195, - "real_time": 3.5828740097200260e+06, - "cpu_time": 5.0715463025636170e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1706535001290076e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 195, - "real_time": 3.5798430645790622e+06, - "cpu_time": 5.0679551282043504e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1716446571361613e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5808872242864133e+06, - "cpu_time": 5.0692774779485594e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1713032418849247e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time_median", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5798438287411742e+06, - "cpu_time": 5.0679551282043504e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1716444070340621e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7645252482931708e+03, - "cpu_time": 2.4391354296275222e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7708935765616060e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.9276202733382628e-04, - "cpu_time": 4.8116037053363162e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9268996876289449e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 143, - "real_time": 4.9000680479188478e+06, - "cpu_time": 7.6252534755230248e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7119370420912421e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 143, - "real_time": 4.9016042286855774e+06, - "cpu_time": 7.6305747972036079e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7114005147350509e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 143, - "real_time": 4.9158946734729344e+06, - "cpu_time": 7.6462645734272571e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7064254946849167e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 143, - "real_time": 4.9079180682091033e+06, - "cpu_time": 7.6303466783212777e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7091988666919615e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 143, - "real_time": 4.9081676105571380e+06, - "cpu_time": 7.6302748531475915e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7091119671538253e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9067305257687215e+06, - "cpu_time": 7.6325428755245525e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7096147770713995e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time_median", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9079180682091024e+06, - "cpu_time": 7.6303466783212777e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.7091988666919615e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.2873803320788866e+03, - "cpu_time": 7.9884429904415501e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1896971950660208e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2813787712733348e-03, - "cpu_time": 1.0466292978265829e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2808132126799999e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 89, - "real_time": 7.7203619869404966e+06, - "cpu_time": 1.3212402157304484e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1731126116080790e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 89, - "real_time": 7.7318281374788014e+06, - "cpu_time": 1.3214605853933249e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1698899279298677e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 89, - "real_time": 7.7357292018328486e+06, - "cpu_time": 1.3231777056180464e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1687956703583841e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 89, - "real_time": 7.7150531604969772e+06, - "cpu_time": 1.3197678101122301e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1746079581024261e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 89, - "real_time": 7.7599720098078251e+06, - "cpu_time": 1.3251760617976379e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1620201695051584e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7325888993113907e+06, - "cpu_time": 1.3221644757303378e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1696852675007830e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time_median", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7318281374788014e+06, - "cpu_time": 1.3214605853933249e+07, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 2.1698899279298677e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7444730728875547e+04, - "cpu_time": 2.0730418281153361e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8879076977209784e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2560013154752159e-03, - "cpu_time": 1.5679152376032708e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2528187709691468e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.3748664317616060e+07, - "cpu_time": 2.4998421686275691e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4405594045238967e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.3736212498270998e+07, - "cpu_time": 2.4962059941175289e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4427717614461451e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3751842227636600e+07, - "cpu_time": 2.4942051784311093e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4399954162189865e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.3720504063017229e+07, - "cpu_time": 2.4946444137256939e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4455684605964222e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.3836699063140972e+07, - "cpu_time": 2.5034637274511982e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4250315661908340e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3758784433936372e+07, - "cpu_time": 2.4976722964706205e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4387853217952571e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time_median", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3748664317616060e+07, - "cpu_time": 2.4962059941175289e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 2.4405594045238967e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5266376882118348e+04, - "cpu_time": 3.9239024573674207e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.9950010060487175e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2899982625258480e-03, - "cpu_time": 1.5710237339430638e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2782717423292416e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 28, - "real_time": 2.5281045253255539e+07, - "cpu_time": 4.8095119071433604e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6545130285448990e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 28, - "real_time": 2.5450983350830417e+07, - "cpu_time": 4.8336290535717450e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6367886487894921e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 28, - "real_time": 2.4401332384773664e+07, - "cpu_time": 4.6467884499999657e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.7502131007352562e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 28, - "real_time": 2.5301331055483647e+07, - "cpu_time": 4.8096103750002131e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6523847244572239e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 28, - "real_time": 2.5464212056249380e+07, - "cpu_time": 4.8321747892860651e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6354188321931705e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5179780820118532e+07, - "cpu_time": 4.7863429150002703e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6658636669440084e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time_median", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5301331055483650e+07, - "cpu_time": 4.8096103750002131e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 2.6523847244572239e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4313171077511215e+05, - "cpu_time": 7.8883086265144416e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7952034647194691e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7598711995977821e-02, - "cpu_time": 1.6480868100345870e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7987429455522053e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 4.5753678679466248e+07, - "cpu_time": 8.7545924466667205e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9334849540794511e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 4.5796846101681389e+07, - "cpu_time": 8.7664055533332422e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9307198950338268e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 4.5672675222158432e+07, - "cpu_time": 8.7580612333325312e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9386876802627773e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.5649827520052589e+07, - "cpu_time": 8.7516358333323300e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9401584910927033e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 4.5335542162259422e+07, - "cpu_time": 8.6742319933334038e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9605409265786290e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5641713937123619e+07, - "cpu_time": 8.7409854119996458e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9407183894094772e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time_median", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5672675222158432e+07, - "cpu_time": 8.7545924466667205e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 2.9386876802627773e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8122339744764121e+05, - "cpu_time": 3.7723895047487400e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1722443453191830e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.9705651215748827e-03, - "cpu_time": 4.3157485420007623e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9862516232116339e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.6650948971509933e+07, - "cpu_time": 1.6582115187500790e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0978940125428886e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.6741509847342968e+07, - "cpu_time": 1.6585116962500024e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0946597133531752e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.6083027534186840e+07, - "cpu_time": 1.6336479762500745e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1183319603088317e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.6600691080093384e+07, - "cpu_time": 1.6543075075000501e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0996918460123510e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.6626107804477215e+07, - "cpu_time": 1.6561568275000128e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0987823740838337e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6540457047522068e+07, - "cpu_time": 1.6521671052500439e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.1018719812602162e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time_median", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6626107804477215e+07, - "cpu_time": 1.6561568275000125e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0987823740838337e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6116883624073552e+05, - "cpu_time": 1.0491021326044858e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3950866941396557e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0178814065809651e-03, - "cpu_time": 6.3498548619615050e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0288441144249471e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.6839752346277237e+08, - "cpu_time": 3.1375624350005180e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1881164340203972e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6750003397464752e+08, - "cpu_time": 3.0942789124998170e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2051988245044756e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.6839155182242393e+08, - "cpu_time": 3.1371546950003904e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1882294936396408e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.6772347316145897e+08, - "cpu_time": 3.0947776750002730e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.2009288973117156e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.6858127713203430e+08, - "cpu_time": 3.1407821774996591e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1846413856475778e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6811877191066742e+08, - "cpu_time": 3.1209111790001321e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1934230070247612e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time_median", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6839155182242393e+08, - "cpu_time": 3.1371546950003904e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.1882294936396408e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7568900618690113e+05, - "cpu_time": 2.4125766153899645e+06, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0451290575204063e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8294818049210235e-03, - "cpu_time": 7.7303597475750600e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8324243414114890e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 3.2177326083183289e+08, - "cpu_time": 5.6083072799992812e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3369516821385775e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 3.2265895605087280e+08, - "cpu_time": 5.6123499699992859e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3277917871608868e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 3.2221984863281250e+08, - "cpu_time": 5.6153820149995685e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3323267593722591e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 3.2266318798065186e+08, - "cpu_time": 5.6155443199997985e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3277481410875597e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 3.2165689766407013e+08, - "cpu_time": 5.6065007950007844e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3381588636764979e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2219443023204809e+08, - "cpu_time": 5.6116168759997439e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3325954466871562e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time_median", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2221984863281250e+08, - "cpu_time": 5.6123499699992871e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.3323267593722591e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7499712721900782e+05, - "cpu_time": 4.1007994750966743e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9135553623501584e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_managed_GPUWrGPU_fine/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4742561715822011e-03, - "cpu_time": 7.3076968112975311e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4743929891744261e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - } - ] -} diff --git a/results/implicit_managed_HostWrGPU_fine.json b/results/implicit_managed_HostWrGPU_fine.json deleted file mode 100644 index 7dcff17..0000000 --- a/results/implicit_managed_HostWrGPU_fine.json +++ /dev/null @@ -1,38 +0,0 @@ -{ - "context": { - "date": "2023-10-09T16:54:29-04:00", - "host_name": "frontier01017", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1813, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [12.35,15.21,12.5], - "library_build_type": "release" - }, - "benchmarks": [ diff --git a/results/implicit_mapped_GPURdHost.json b/results/implicit_mapped_GPURdHost.json deleted file mode 100644 index 4164a67..0000000 --- a/results/implicit_mapped_GPURdHost.json +++ /dev/null @@ -1,1698 +0,0 @@ -{ - "context": { - "date": "2023-10-09T16:57:39-04:00", - "host_name": "frontier01024", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1881, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [0.74,7.12,7.18], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52418, - "real_time": 1.3358390169694165e+04, - "cpu_time": 2.0462372448395596e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0662377337147182e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52418, - "real_time": 1.3356491396170082e+04, - "cpu_time": 2.0460801575794569e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0666736334472620e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52418, - "real_time": 1.3361756165410265e+04, - "cpu_time": 2.0413873516730895e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0654653095701319e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52418, - "real_time": 1.3352849635545979e+04, - "cpu_time": 2.0423873764737313e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0675100160614675e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52418, - "real_time": 1.3351372984195657e+04, - "cpu_time": 2.0422418844671676e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0678492802564454e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3356172070203233e+04, - "cpu_time": 2.0436668030066015e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0667471946100050e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3356491396170084e+04, - "cpu_time": 2.0423873764737313e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.0666736334472620e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1914750407985126e+00, - "cpu_time": 2.3073076834768418e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6237729607467365e+04, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1382307885576189e-04, - "cpu_time": 1.1290038474385245e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1381044311905147e-04, - "own_numa": NaN, - "rd_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52340, - "real_time": 1.3375127635009039e+04, - "cpu_time": 2.0505235364921678e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1248013653026080e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52340, - "real_time": 1.3377205640093345e+04, - "cpu_time": 2.0507505464272057e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1238499432552922e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52340, - "real_time": 1.3370425115816619e+04, - "cpu_time": 2.0464759705769950e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1269555223859179e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52340, - "real_time": 1.3372914165293721e+04, - "cpu_time": 2.0560072888803952e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1258151355374908e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52340, - "real_time": 1.3373014663519929e+04, - "cpu_time": 2.0565893714176538e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1257691000271237e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3373737443946531e+04, - "cpu_time": 2.0520693427588834e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1254382133016860e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3373014663519929e+04, - "cpu_time": 2.0507505464272057e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.1257691000271237e+08, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5560092295271906e+00, - "cpu_time": 4.2235243538726742e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1706793309869274e+05, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9112153504136114e-04, - "cpu_time": 2.0581781842685686e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9111764582732064e-04, - "own_numa": NaN, - "rd_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52093, - "real_time": 1.3435814949350908e+04, - "cpu_time": 2.0616280517535961e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2194273337168522e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52093, - "real_time": 1.3435559982769335e+04, - "cpu_time": 2.0627498397097490e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2194504747857137e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52093, - "real_time": 1.3435093526082268e+04, - "cpu_time": 2.0550394045265166e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2194928132203071e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52093, - "real_time": 1.3438097386303059e+04, - "cpu_time": 2.0634596759641423e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2192202161519969e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52093, - "real_time": 1.3435084102712914e+04, - "cpu_time": 2.0628576948918344e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2194936685726902e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3435929989443699e+04, - "cpu_time": 2.0611469333691679e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2194169012895119e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3435559982769337e+04, - "cpu_time": 2.0627498397097494e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.2194504747857137e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2512936883410561e+00, - "cpu_time": 3.4777210746793358e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1355273805593593e+05, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.3130411465687082e-05, - "cpu_time": 1.6872747004963030e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3120521731210958e-05, - "own_numa": NaN, - "rd_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 50970, - "real_time": 1.3730673399225387e+04, - "cpu_time": 2.0828173337257205e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.3864816420328374e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 50970, - "real_time": 1.3730441031465822e+04, - "cpu_time": 2.0821078359819559e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.3865220297662778e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 50970, - "real_time": 1.3730653643990508e+04, - "cpu_time": 2.0806441553855213e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.3864850756279593e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 50970, - "real_time": 1.3731015816575458e+04, - "cpu_time": 2.0824535471846157e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.3864221291220102e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 50970, - "real_time": 1.3730094764492513e+04, - "cpu_time": 2.0814677104178867e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.3865822168060732e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3730575731149938e+04, - "cpu_time": 2.0818981165391404e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.3864986186710315e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3730653643990508e+04, - "cpu_time": 2.0821078359819556e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.3864850756279593e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3865817261176245e-01, - "cpu_time": 8.5952220550092662e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8862138595195465e+04, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4664528221017263e-05, - "cpu_time": 4.1285507617911689e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4664643899091801e-05, - "own_numa": NaN, - "rd_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49187, - "real_time": 1.4229580193373125e+04, - "cpu_time": 2.1638558826519231e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.6056172500802832e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49187, - "real_time": 1.4231293878500532e+04, - "cpu_time": 2.1656113464939910e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.6050626569525347e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49187, - "real_time": 1.4233649316842781e+04, - "cpu_time": 2.1648352959115207e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.6043005936960077e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49187, - "real_time": 1.4231573812434501e+04, - "cpu_time": 2.1642227661780566e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.6049720757334290e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49187, - "real_time": 1.4233639008730754e+04, - "cpu_time": 2.1635782157887294e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.6043039281662941e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4231947241976337e+04, - "cpu_time": 2.1644207014048443e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.6048513009257097e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4231573812434499e+04, - "cpu_time": 2.1642227661780566e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 4.6049720757334290e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7268747952230747e+00, - "cpu_time": 8.1509277349318072e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5875563231165730e+05, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2133791433190205e-04, - "cpu_time": 3.7658703456501530e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2134064615709330e-04, - "own_numa": NaN, - "rd_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 45925, - "real_time": 1.5234444857167735e+04, - "cpu_time": 2.3655564746869877e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6036610607659416e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 45925, - "real_time": 1.5238500404311129e+04, - "cpu_time": 2.3678326663037638e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6013712978554230e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 45925, - "real_time": 1.5239364961775815e+04, - "cpu_time": 2.3689270898203635e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6008833260940838e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 45925, - "real_time": 1.5239027913773058e+04, - "cpu_time": 2.3616169145345641e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6010735554553928e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 45925, - "real_time": 1.5238414761358836e+04, - "cpu_time": 2.3608568600979812e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6014196392900963e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5237950579677316e+04, - "cpu_time": 2.3649580010887323e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6016817758921871e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5238500404311129e+04, - "cpu_time": 2.3655564746869873e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 8.6013712978554230e+09, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9980607697744326e+00, - "cpu_time": 3.6179328659096058e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1280663764867738e+06, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3112398280377833e-04, - "cpu_time": 1.5298085057933602e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3114486281605878e-04, - "own_numa": NaN, - "rd_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 37024, - "real_time": 1.8903840236089778e+04, - "cpu_time": 2.9221954380942087e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3867235266807562e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 37024, - "real_time": 1.8908442559862226e+04, - "cpu_time": 2.9241503268150409e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3863859975250658e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 37024, - "real_time": 1.8903118840240546e+04, - "cpu_time": 2.9252199114088147e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3867764479264318e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 37024, - "real_time": 1.8898801074573792e+04, - "cpu_time": 2.9261104661840949e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3870932815557556e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 37024, - "real_time": 1.8904247278792791e+04, - "cpu_time": 2.9266923428046783e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3866936680101461e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8903689997911828e+04, - "cpu_time": 2.9248736970613681e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3867345843396311e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8903840236089782e+04, - "cpu_time": 2.9252199114088151e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.3867235266807562e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4332117268321070e+00, - "cpu_time": 1.7785717703593466e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5185583198012309e+06, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8161595578489452e-04, - "cpu_time": 6.0808498231779530e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8161790642876185e-04, - "own_numa": NaN, - "rd_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 23887, - "real_time": 2.9311693284488039e+04, - "cpu_time": 4.4401035249298569e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7886650044794819e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 23887, - "real_time": 2.9314942598556816e+04, - "cpu_time": 4.4156121907313784e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7884667460539761e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 23887, - "real_time": 2.9294042889368237e+04, - "cpu_time": 4.3973727550550357e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7897427199790207e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 23887, - "real_time": 2.9288786251919788e+04, - "cpu_time": 4.3989489973625939e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7900639360418514e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 23887, - "real_time": 2.9298136159463975e+04, - "cpu_time": 4.3979957257085392e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7894926733441467e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9301520236759370e+04, - "cpu_time": 4.4100066387574807e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7892862159796955e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9298136159463978e+04, - "cpu_time": 4.3989489973625939e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.7894926733441467e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1326603301115782e+01, - "cpu_time": 1.8462077707425183e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9161111270192880e+06, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8655343509809843e-04, - "cpu_time": 4.1864058763927108e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8652905640546053e-04, - "own_numa": NaN, - "rd_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 14022, - "real_time": 4.9914346831678551e+04, - "cpu_time": 7.6438336257309769e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.1007507190988876e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 14022, - "real_time": 4.9917118198893630e+04, - "cpu_time": 7.6495473826843867e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.1006340867314747e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 14022, - "real_time": 4.9931645792176256e+04, - "cpu_time": 7.6462936670945623e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.1000229080458241e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 14022, - "real_time": 4.9923556309128930e+04, - "cpu_time": 7.6362129938667829e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.1003631902887081e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 14022, - "real_time": 4.9924856206020559e+04, - "cpu_time": 7.6365696762231004e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.1003085029888374e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9922304667579599e+04, - "cpu_time": 7.6424914691199621e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.1004158814307465e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9923556309128930e+04, - "cpu_time": 7.6438336257309755e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 2.1003631902887081e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8110236250369214e+00, - "cpu_time": 5.9272863232660242e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8655906054564039e+06, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3643247583199254e-04, - "cpu_time": 7.7556989722731798e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3642967713158030e-04, - "own_numa": NaN, - "rd_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7691, - "real_time": 9.1018540574250248e+04, - "cpu_time": 1.3152713223247961e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.3040931954838425e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7691, - "real_time": 9.1014194496523560e+04, - "cpu_time": 1.3160289910284677e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.3042032197297581e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7691, - "real_time": 9.1022912875129841e+04, - "cpu_time": 1.3161464269925884e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.3039825179809250e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7691, - "real_time": 9.1043195351036164e+04, - "cpu_time": 1.3161925939409694e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.3034692399733887e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7691, - "real_time": 9.1029068535830927e+04, - "cpu_time": 1.3161493446885981e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.3038267157205036e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1025582366554154e+04, - "cpu_time": 1.3159577357950842e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.3039149777776836e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1022912875129856e+04, - "cpu_time": 1.3161464269925884e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.3039825179809250e+10, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1277934269366469e+01, - "cpu_time": 3.8849628167120308e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8542907817669874e+06, - "own_numa": 0.0000000000000000e+00, - "rd_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPURdHost/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2389851266153898e-04, - "cpu_time": 2.9521942164539107e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2388872025651687e-04, - "own_numa": NaN, - "rd_gpu": NaN - } \ No newline at end of file diff --git a/results/implicit_mapped_GPUWrGPU.json b/results/implicit_mapped_GPUWrGPU.json deleted file mode 100644 index e6a6e94..0000000 --- a/results/implicit_mapped_GPUWrGPU.json +++ /dev/null @@ -1,6180 +0,0 @@ -{ - "context": { - "date": "2023-10-09T16:53:41-04:00", - "host_name": "frontier10355", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1795, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [0.32,1.87,5.8], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 57077, - "real_time": 1.2265398267579003e+04, - "cpu_time": 2.8594602764686297e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3394757435858512e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 57077, - "real_time": 1.2260957366303213e+04, - "cpu_time": 2.8522828109396072e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3406852969385868e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 57077, - "real_time": 1.2260377543855271e+04, - "cpu_time": 2.8577834469225771e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3408432859009773e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 57077, - "real_time": 1.2255939666425886e+04, - "cpu_time": 2.8544030152250463e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3420530057117099e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 57077, - "real_time": 1.2257770203752671e+04, - "cpu_time": 2.8534439301294744e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3415539138970190e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2260088609583210e+04, - "cpu_time": 2.8554746959370670e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3409222492068291e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2260377543855273e+04, - "cpu_time": 2.8544030152250467e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3408432859009773e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5923329537607622e+00, - "cpu_time": 3.0280283364606639e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7882207882740360e+04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9301035809421331e-04, - "cpu_time": 1.0604290560757258e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9297960437714063e-04, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 57089, - "real_time": 1.2263251255269017e+04, - "cpu_time": 2.8484953248436661e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6801208174546981e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 57089, - "real_time": 1.2257550844182846e+04, - "cpu_time": 2.8437676154775851e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6832274278411305e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 57089, - "real_time": 1.2260639383155847e+04, - "cpu_time": 2.8456206764875882e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6815438771117389e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 57089, - "real_time": 1.2257108153272411e+04, - "cpu_time": 2.8457499465746499e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6834688064760983e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 57089, - "real_time": 1.2260407201787124e+04, - "cpu_time": 2.8450703095167213e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6816704087984145e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2259791367533448e+04, - "cpu_time": 2.8457407745800425e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6820062675364161e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2260407201787126e+04, - "cpu_time": 2.8456206764875882e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6816704087984145e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5143979973389525e+00, - "cpu_time": 1.7280722700095616e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3703813950867837e+05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0509304946229482e-04, - "cpu_time": 6.0724865927557306e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0508532021955566e-04, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 57127, - "real_time": 1.2251652165090634e+04, - "cpu_time": 2.8713939835804464e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3372890267554209e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 57127, - "real_time": 1.2252987227658265e+04, - "cpu_time": 2.8679777338211348e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3371433182446268e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 57127, - "real_time": 1.2251170643742193e+04, - "cpu_time": 2.8698282475887063e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3373415877093203e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 57127, - "real_time": 1.2246266687984305e+04, - "cpu_time": 2.8688373991282540e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3378771194061551e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 57127, - "real_time": 1.2247364340370736e+04, - "cpu_time": 2.8683761391286054e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3377572140965676e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2249888212969228e+04, - "cpu_time": 2.8692827006494295e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3374816532424181e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2251170643742193e+04, - "cpu_time": 2.8688373991282540e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3373415877093203e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9088409966533293e+00, - "cpu_time": 1.3673169656350671e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1761657689736533e+05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3745857481161954e-04, - "cpu_time": 4.7653616192144138e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3747359534044947e-04, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 57075, - "real_time": 1.2253948088062472e+04, - "cpu_time": 2.9031500359176487e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6740769394903722e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 57075, - "real_time": 1.2255974268358494e+04, - "cpu_time": 2.8992073622426688e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6736348561532016e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 57075, - "real_time": 1.2258345468525182e+04, - "cpu_time": 2.9036876723609221e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6731176800438437e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 57075, - "real_time": 1.2255015756808267e+04, - "cpu_time": 2.8999440402978482e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6738439713384910e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 57075, - "real_time": 1.2257833172413013e+04, - "cpu_time": 2.9124508261060022e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6732293986302853e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2256223350833487e+04, - "cpu_time": 2.9036879873850186e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6735805691312389e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2255974268358494e+04, - "cpu_time": 2.9031500359176491e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6736348561532016e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8568827976926816e+00, - "cpu_time": 5.2718563094567529e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0506121848431748e+05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5150530016788604e-04, - "cpu_time": 1.8155725864349641e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5150514750185339e-04, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 57110, - "real_time": 1.2261983400761912e+04, - "cpu_time": 2.9679773332166071e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3446492184884090e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 57110, - "real_time": 1.2259938612186901e+04, - "cpu_time": 2.9649723113290063e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3455406322226133e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 57110, - "real_time": 1.2260207128927859e+04, - "cpu_time": 2.9707655962178229e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3454235569453268e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 57110, - "real_time": 1.2262126317861161e+04, - "cpu_time": 2.9665830187357671e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3445869257226191e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 57110, - "real_time": 1.2260032622836925e+04, - "cpu_time": 2.9678303764664659e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3454996423031721e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2260857616514952e+04, - "cpu_time": 2.9676257271931339e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3451399951364288e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2260207128927859e+04, - "cpu_time": 2.9678303764664655e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3454235569453268e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0983295234860022e+00, - "cpu_time": 2.1302665499104908e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7880343657914572e+05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.9580154817766591e-05, - "cpu_time": 7.1783531541403582e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9577342598100618e-05, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 57059, - "real_time": 1.2267836301377924e+04, - "cpu_time": 3.1016258066212096e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0684198645956663e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 57059, - "real_time": 1.2266933372734089e+04, - "cpu_time": 3.0979139960391865e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0684985074699749e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 57059, - "real_time": 1.2268147236702178e+04, - "cpu_time": 3.1007561962179490e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0683927855697443e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 57059, - "real_time": 1.2268124966204010e+04, - "cpu_time": 3.0982571794107811e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0683947250380524e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 57059, - "real_time": 1.2269330816500296e+04, - "cpu_time": 3.0999598415674966e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0682897214225328e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2268074538703699e+04, - "cpu_time": 3.0997026039713248e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0683991208191940e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2268124966204010e+04, - "cpu_time": 3.0999598415674969e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0683947250380524e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5806155455322197e-01, - "cpu_time": 1.5939970765569608e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4725662483513658e+05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.9942642738775589e-05, - "cpu_time": 5.1424193873139299e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9941710946203167e-05, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 56074, - "real_time": 1.2486006628770727e+04, - "cpu_time": 3.2742411723793550e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0995023292391811e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 56074, - "real_time": 1.2487170609526585e+04, - "cpu_time": 3.2698925188144218e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0993066259542233e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 56074, - "real_time": 1.2486579319081178e+04, - "cpu_time": 3.2718561311837864e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0994060366829895e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 56074, - "real_time": 1.2489038854278699e+04, - "cpu_time": 3.2727235242715018e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0989925890909569e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 56074, - "real_time": 1.2487951667418560e+04, - "cpu_time": 3.2721876538146051e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0991753249969852e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2487349415815153e+04, - "cpu_time": 3.2721802000927342e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0992765811928673e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2487170609526587e+04, - "cpu_time": 3.2721876538146054e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0993066259542233e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1879611671687293e+00, - "cpu_time": 1.5717323067201161e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9970473487826972e+06, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.5133172590188261e-05, - "cpu_time": 4.8033183095343369e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5130263762001260e-05, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 55853, - "real_time": 1.2526670310007275e+04, - "cpu_time": 3.2784903317637290e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 4.1853739822717140e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 55853, - "real_time": 1.2531316701783719e+04, - "cpu_time": 3.2752745528440697e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 4.1838221192300758e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 55853, - "real_time": 1.2527993499446267e+04, - "cpu_time": 3.2789307933324926e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 4.1849319288294121e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 55853, - "real_time": 1.2531112950772913e+04, - "cpu_time": 3.2782837054410680e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 4.1838901465464981e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 55853, - "real_time": 1.2529007549856315e+04, - "cpu_time": 3.2778326231357147e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 4.1845932162920013e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2529220202373301e+04, - "cpu_time": 3.2777624013034147e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 4.1845222786339401e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2529007549856315e+04, - "cpu_time": 3.2782837054410687e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 4.1845932162920013e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0018602865659232e+00, - "cpu_time": 1.4457784890890931e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6859155902060261e+06, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5977532952822783e-04, - "cpu_time": 4.4108703196856918e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5977727312730856e-04, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 55525, - "real_time": 1.2613260993542659e+04, - "cpu_time": 3.2935764016208792e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 8.3132823505104431e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 55525, - "real_time": 1.2612980434811965e+04, - "cpu_time": 3.2903763601980965e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 8.3134672682589661e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 55525, - "real_time": 1.2612715185665782e+04, - "cpu_time": 3.2932693867627058e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 8.3136421029446198e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 55525, - "real_time": 1.2612681289105369e+04, - "cpu_time": 3.2924224853669541e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 8.3136644458442245e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 55525, - "real_time": 1.2616224680234156e+04, - "cpu_time": 3.2930877046375608e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 8.3113294711912064e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2613572516671984e+04, - "cpu_time": 3.2925464677172393e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 8.3130771277498917e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2612980434811961e+04, - "cpu_time": 3.2930877046375601e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 8.3134672682589661e+10, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5009065611780898e+00, - "cpu_time": 1.2846255739277908e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.8903602040127944e+06, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1899139273938982e-04, - "cpu_time": 3.9016171420002370e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1897351668971978e-04, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 54888, - "real_time": 1.2782546425658455e+04, - "cpu_time": 3.3315992931059445e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.6406371079477393e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 54888, - "real_time": 1.2779470874477673e+04, - "cpu_time": 3.3264041375164132e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.6410319492869580e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 54888, - "real_time": 1.2754710679581551e+04, - "cpu_time": 3.3298756467716143e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.6442176170700897e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 54888, - "real_time": 1.2752037597304234e+04, - "cpu_time": 3.3270766178399768e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.6445622779871161e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 54888, - "real_time": 1.2778057794508160e+04, - "cpu_time": 3.3306770532721006e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.6412134251743079e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2769364674306013e+04, - "cpu_time": 3.3291265497012100e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.6423324754932422e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2778057794508160e+04, - "cpu_time": 3.3298756467716143e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 1.6412134251743079e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4717602965422369e+01, - "cpu_time": 2.2745008481396535e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8936532861228931e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1525712782748322e-03, - "cpu_time": 6.8321249258121192e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1530267557756061e-03, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 52522, - "real_time": 1.3357488671915737e+04, - "cpu_time": 3.4429442005255158e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1400393464817749e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 52522, - "real_time": 1.3323189900729141e+04, - "cpu_time": 3.4323002322836204e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1481229579790479e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 52522, - "real_time": 1.3356815776056146e+04, - "cpu_time": 3.4423979760862232e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1401975368402124e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 52522, - "real_time": 1.3330796919159478e+04, - "cpu_time": 3.4377367465062154e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1463265290402875e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 52522, - "real_time": 1.3355691748399669e+04, - "cpu_time": 3.4435235577472289e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1404618188365851e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3344796603252038e+04, - "cpu_time": 3.4397805426297607e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1430296378355817e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3355691748399669e+04, - "cpu_time": 3.4423979760862232e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1404618188365851e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6485554722810345e+01, - "cpu_time": 4.7697483377660227e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8848337977911675e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2353545140427939e-03, - "cpu_time": 1.3866432112903000e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2360156426862148e-03, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 48536, - "real_time": 1.4457836294255223e+04, - "cpu_time": 3.7526390308224669e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.8021185392265002e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 48536, - "real_time": 1.4420067014860264e+04, - "cpu_time": 3.7461360248063203e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.8173155446193945e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 48536, - "real_time": 1.4449626825871193e+04, - "cpu_time": 3.7537688293225634e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.8054149779015039e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 48536, - "real_time": 1.4420674030392767e+04, - "cpu_time": 3.7491791247733643e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.8170706738952087e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 48536, - "real_time": 1.4438528572710768e+04, - "cpu_time": 3.7487570607384223e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.8098773415559180e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4437346547618043e+04, - "cpu_time": 3.7500960140926269e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.8103594154397058e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4438528572710766e+04, - "cpu_time": 3.7491791247733650e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.8098773415559180e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6945406586209792e+01, - "cpu_time": 3.0931983069850283e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8194688529398179e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1737202906586420e-03, - "cpu_time": 8.2483176306979370e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1736741852524017e-03, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 33718, - "real_time": 2.0753074473605120e+04, - "cpu_time": 4.9258514028115787e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 8.0842074851792053e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 33718, - "real_time": 2.0758455854546733e+04, - "cpu_time": 4.9169035441010572e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 8.0821117512578748e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 33718, - "real_time": 2.0753131626275914e+04, - "cpu_time": 4.9229324099887126e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 8.0841852218380676e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 33718, - "real_time": 2.0761311865410753e+04, - "cpu_time": 4.9167843318109262e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 8.0809999429523389e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 33718, - "real_time": 2.0752110331051848e+04, - "cpu_time": 4.9228338780473503e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 8.0845830772670264e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0755616830178078e+04, - "cpu_time": 4.9210611133519255e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 8.0832174956989026e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time_median", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0753131626275917e+04, - "cpu_time": 4.9228338780473510e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 8.0841852218380676e+11, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0444046874083908e+00, - "cpu_time": 4.0363213850256393e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5749283359776953e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9485832295419627e-04, - "cpu_time": 8.2021362711269898e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9483928730307183e-04, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 21430, - "real_time": 3.2663591698530130e+04, - "cpu_time": 7.3308554596360671e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.0272731887445789e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 21430, - "real_time": 3.2668339937710596e+04, - "cpu_time": 7.3274887167521912e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.0271238778578567e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 21430, - "real_time": 3.2658394100044006e+04, - "cpu_time": 7.3295061735884345e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.0274366797464419e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 21430, - "real_time": 3.2672155943209018e+04, - "cpu_time": 7.3279588940736634e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.0270039130054520e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 21430, - "real_time": 3.2656102280344989e+04, - "cpu_time": 7.3357424125058154e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.0275087857069734e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2663716791967752e+04, - "cpu_time": 7.3303103313112355e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.0272692890122606e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time_median", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2663591698530130e+04, - "cpu_time": 7.3295061735884345e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.0272731887445789e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6880534408385897e+00, - "cpu_time": 3.3144421245377941e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1033447206976455e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0475481965001707e-04, - "cpu_time": 4.5215577168407703e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0475105633889360e-04, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 11718, - "real_time": 5.9742900005380681e+04, - "cpu_time": 1.2440073468168431e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.1232943829970742e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 11718, - "real_time": 5.9758533825950413e+04, - "cpu_time": 1.2436839204642551e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.1230005106125557e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 11718, - "real_time": 5.9761988769530886e+04, - "cpu_time": 1.2442184016043547e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.1229355880173594e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 11718, - "real_time": 5.9783453167371881e+04, - "cpu_time": 1.2440015326847638e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.1225324139794941e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 11718, - "real_time": 5.9768432359891420e+04, - "cpu_time": 1.2443100819252558e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.1228145251645332e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9763061625625065e+04, - "cpu_time": 1.2440442566990943e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.1229154841542034e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time_median", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9761988769530879e+04, - "cpu_time": 1.2440073468168429e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.1229355880173594e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4771617049701263e+01, - "cpu_time": 2.4187774842759449e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7754885709660673e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4716968387990891e-04, - "cpu_time": 1.9442857207458585e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4716807365574858e-04, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6365, - "real_time": 1.0986185416665027e+05, - "cpu_time": 2.2184965797328952e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.2216954557894512e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6365, - "real_time": 1.0986862917143913e+05, - "cpu_time": 2.2181887132757259e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.2216201204309785e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6365, - "real_time": 1.0981450986024944e+05, - "cpu_time": 2.2180189363707785e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.2222221650928118e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6365, - "real_time": 1.0983082107573714e+05, - "cpu_time": 2.2179251076197915e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.2220406502055203e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6365, - "real_time": 1.0982735679055638e+05, - "cpu_time": 2.2180216449332525e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.2220791970433804e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0984063421292650e+05, - "cpu_time": 2.2181301963864890e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.2219315177124285e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time_median", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0983082107573717e+05, - "cpu_time": 2.2180216449332525e+05, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.2220406502055203e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3393768102350741e+01, - "cpu_time": 2.2576790562508606e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6023474257082525e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1297917906229339e-04, - "cpu_time": 1.0178298189749186e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1296998956047008e-04, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3277, - "real_time": 2.1348638472793554e+05, - "cpu_time": 4.2152575007629220e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2573891133249124e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3277, - "real_time": 2.1357305352821908e+05, - "cpu_time": 4.2164461214525177e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2568788597880491e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3277, - "real_time": 2.1347906688194285e+05, - "cpu_time": 4.2149091211474332e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2574322153490059e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3277, - "real_time": 2.1353590140512952e+05, - "cpu_time": 4.2163616173329722e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2570975383231350e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3277, - "real_time": 2.1352511461701119e+05, - "cpu_time": 4.2159660909367853e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2571610439431379e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1351990423204764e+05, - "cpu_time": 4.2157880903265264e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2571917541456482e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time_median", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1352511461701119e+05, - "cpu_time": 4.2159660909367847e+05, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.2571610439431379e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8402967445671223e+01, - "cpu_time": 6.7965699173690012e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2610553461271098e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7985661610233730e-04, - "cpu_time": 1.6121706717100632e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7984967994509786e-04, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1600, - "real_time": 4.3715133115256322e+05, - "cpu_time": 8.3444874625000055e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.2281122662591990e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1600, - "real_time": 4.3744153557781829e+05, - "cpu_time": 8.3477044312500581e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.2272975205494490e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1600, - "real_time": 4.3760953161836369e+05, - "cpu_time": 8.3494433874999883e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.2268263673657856e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1600, - "real_time": 4.3766004047938623e+05, - "cpu_time": 8.3500025562498684e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.2266847834952998e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1600, - "real_time": 4.3743884067225741e+05, - "cpu_time": 8.3475497124998912e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.2273050814942156e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3746025590007781e+05, - "cpu_time": 8.3478375099999621e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.2272452038327898e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time_median", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3744153557781840e+05, - "cpu_time": 8.3477044312500593e+05, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.2272975205494490e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9902303897548117e+02, - "cpu_time": 2.1557842757120844e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5848334045982444e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5495113279717206e-04, - "cpu_time": 2.5824463798314806e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5507070528011363e-04, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 725, - "real_time": 9.5729840550057834e+05, - "cpu_time": 1.7339409310345044e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1216375352035945e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 725, - "real_time": 9.5656264565307007e+05, - "cpu_time": 1.7332407489655076e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1225002658000813e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 725, - "real_time": 9.6004977709902765e+05, - "cpu_time": 1.7366328620689807e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1184230751498264e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 725, - "real_time": 9.5958656808040256e+05, - "cpu_time": 1.7361525131034262e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1189629572952009e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 725, - "real_time": 9.6113647872196708e+05, - "cpu_time": 1.7378182441379507e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1171585386372656e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5892677501100919e+05, - "cpu_time": 1.7355570598620740e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1197364744171938e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time_median", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5958656808040256e+05, - "cpu_time": 1.7361525131034262e+06, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1189629572952009e+12, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9248341459696992e+03, - "cpu_time": 1.9106306443146609e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2484257926169715e+09, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0072795922791921e-03, - "cpu_time": 1.1008745771035036e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0079954917850145e-03, - "own_gpu": NaN, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 56922, - "real_time": 1.2300657580502449e+04, - "cpu_time": 3.1282197761849366e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3299032780918115e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 56922, - "real_time": 1.2299881556696637e+04, - "cpu_time": 3.1268270159165080e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3301133682624316e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 56922, - "real_time": 1.2299486314620826e+04, - "cpu_time": 3.1301072274340670e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3302203809365135e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 56922, - "real_time": 1.2294069100573473e+04, - "cpu_time": 3.1307357208109610e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3316877971744406e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 56922, - "real_time": 1.2298648397656983e+04, - "cpu_time": 3.1298715329749917e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3304472715719956e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2298548590010078e+04, - "cpu_time": 3.1291522546642933e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3304744192074394e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time_median", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2299486314620826e+04, - "cpu_time": 3.1298715329749917e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 3.3302203809365135e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6067103617836533e+00, - "cpu_time": 1.5978853732054684e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0606629575415936e+04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1195268227838240e-04, - "cpu_time": 5.1064481468540604e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1200171713739918e-04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 56901, - "real_time": 1.2304476891892726e+04, - "cpu_time": 3.1267631570622769e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6577393512743413e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 56901, - "real_time": 1.2300647544873444e+04, - "cpu_time": 3.1287427936240176e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6598119896656907e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 56901, - "real_time": 1.2297120564843020e+04, - "cpu_time": 3.1302017433788471e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6617221135658395e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 56901, - "real_time": 1.2296963343129175e+04, - "cpu_time": 3.1274065833640656e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6618072864120638e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 56901, - "real_time": 1.2303546946435121e+04, - "cpu_time": 3.1263026168257067e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6582425666881239e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2300551058234696e+04, - "cpu_time": 3.1278833788509830e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6598646615212119e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time_median", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2300647544873445e+04, - "cpu_time": 3.1274065833640652e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 6.6598119896656907e+08, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5013144046292530e+00, - "cpu_time": 1.5885879896782871e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8957075977059331e+05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8464695508785938e-04, - "cpu_time": 5.0787954577189169e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8464656476561573e-04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 56915, - "real_time": 1.2296919443697565e+04, - "cpu_time": 3.1469531160502444e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3323662137509692e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 56915, - "real_time": 1.2294805362533842e+04, - "cpu_time": 3.1487146745146259e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3325953129707305e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 56915, - "real_time": 1.2295727512195619e+04, - "cpu_time": 3.1535781569006467e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3324953715629592e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 56915, - "real_time": 1.2296609966228860e+04, - "cpu_time": 3.1528611490819636e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3323997463525848e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 56915, - "real_time": 1.2296419715453711e+04, - "cpu_time": 3.1497936712641720e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3324203613031492e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2296096400021921e+04, - "cpu_time": 3.1503801535623312e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3324554011880786e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time_median", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2296419715453709e+04, - "cpu_time": 3.1497936712641724e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.3324203613031492e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4388091803414844e-01, - "cpu_time": 2.7948583219795001e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1450244395518152e+04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.8629985532046091e-05, - "cpu_time": 8.8714954568869405e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8632874551731262e-05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 56875, - "real_time": 1.2308277073172356e+04, - "cpu_time": 3.1773206821977648e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6622735095411954e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 56875, - "real_time": 1.2303888735202767e+04, - "cpu_time": 3.1760486189011150e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6632230431544123e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 56875, - "real_time": 1.2306038428761274e+04, - "cpu_time": 3.1843311068131607e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6627578151727276e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 56875, - "real_time": 1.2303404902539134e+04, - "cpu_time": 3.1811949397801935e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6633277746745906e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 56875, - "real_time": 1.2305950639855148e+04, - "cpu_time": 3.1798173046153959e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6627768109092393e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2305511955906137e+04, - "cpu_time": 3.1797425304615259e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6628717906904335e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time_median", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2305950639855148e+04, - "cpu_time": 3.1798173046153963e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 2.6627768109092393e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9487181724374707e+00, - "cpu_time": 3.2665137595481923e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2167866438794363e+05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5836140580093190e-04, - "cpu_time": 1.0272887594688592e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5835485052722353e-04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 56856, - "real_time": 1.2311782890277755e+04, - "cpu_time": 3.2433418407907782e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3230308383485069e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 56856, - "real_time": 1.2311622117749497e+04, - "cpu_time": 3.2445721630083299e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3231003496702232e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 56856, - "real_time": 1.2312362218407210e+04, - "cpu_time": 3.2467277472914182e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3227803761346836e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 56856, - "real_time": 1.2314124051181219e+04, - "cpu_time": 3.2448877972421866e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3220188238816338e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 56856, - "real_time": 1.2314363478348865e+04, - "cpu_time": 3.2435756050372980e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3219153483024530e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2312850951192911e+04, - "cpu_time": 3.2446210306740024e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3225691472675009e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time_median", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2312362218407212e+04, - "cpu_time": 3.2445721630083299e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 5.3227803761346836e+09, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3036647767062060e+00, - "cpu_time": 1.3454598534673440e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6352932189904724e+05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0587838526380460e-04, - "cpu_time": 4.1467396060977039e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0587543464575782e-04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 56832, - "real_time": 1.2320036524637768e+04, - "cpu_time": 3.3851581802505731e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0638929498129372e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 56832, - "real_time": 1.2316519972335163e+04, - "cpu_time": 3.3866382196649713e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0641967073037537e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 56832, - "real_time": 1.2321398960215536e+04, - "cpu_time": 3.3869304546734362e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0637753101187397e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 56832, - "real_time": 1.2317928490418113e+04, - "cpu_time": 3.3895798493806113e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0640750196103062e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 56832, - "real_time": 1.2319333045512964e+04, - "cpu_time": 3.3855213172156153e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0639537020045090e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2319043398623908e+04, - "cpu_time": 3.3867656042370414e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0639787377700493e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time_median", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2319333045512964e+04, - "cpu_time": 3.3866382196649720e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.0639537020045090e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8861048247832908e+00, - "cpu_time": 1.7389249761764223e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6290340798399523e+06, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5310481209880120e-04, - "cpu_time": 5.1344709949839031e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5310776635012275e-04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 55766, - "real_time": 1.2553679625436755e+04, - "cpu_time": 3.5782600527203256e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0881845627861458e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 55766, - "real_time": 1.2551579026262518e+04, - "cpu_time": 3.5794911953519892e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0885340358491821e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 55766, - "real_time": 1.2550233080993901e+04, - "cpu_time": 3.5795592852275615e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0887580199366287e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 55766, - "real_time": 1.2547462415145366e+04, - "cpu_time": 3.5811149230713891e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0892192486950993e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 55766, - "real_time": 1.2548574851049752e+04, - "cpu_time": 3.5767461320517730e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0890340386188976e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2550305799777660e+04, - "cpu_time": 3.5790343176846080e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0887459811771912e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time_median", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2550233080993903e+04, - "cpu_time": 3.5794911953519892e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.0887580199366287e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4540839917514603e+00, - "cpu_time": 1.6316040132882787e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0841632870001658e+06, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9553977655229217e-04, - "cpu_time": 4.5587828125208244e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9553183220002570e-04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 44400, - "real_time": 1.5776501037540944e+04, - "cpu_time": 3.9056301914414405e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3232210282396042e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 44400, - "real_time": 1.5764169656371825e+04, - "cpu_time": 3.9062361689189187e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3258205882609520e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 44400, - "real_time": 1.5767283575585041e+04, - "cpu_time": 3.9072668626125953e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3251637638574432e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 44400, - "real_time": 1.5771456236249120e+04, - "cpu_time": 3.9057836981982320e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3242840239126194e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 44400, - "real_time": 1.5773293535091994e+04, - "cpu_time": 3.9055280382882527e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3238968059117031e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5770540808167785e+04, - "cpu_time": 3.9060889918918881e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3244772420364643e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time_median", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5771456236249122e+04, - "cpu_time": 3.9057836981982320e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3242840239126194e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8770120874113916e+00, - "cpu_time": 7.1193601384426630e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0281298241447916e+07, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0924824625453031e-04, - "cpu_time": 1.8226313207970327e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0926059927394585e-04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 36315, - "real_time": 1.9280883573274412e+04, - "cpu_time": 4.2983594107118202e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4384229644612885e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 36315, - "real_time": 1.9280130850915521e+04, - "cpu_time": 4.2992932286933494e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4386352878419823e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 36315, - "real_time": 1.9282981989704225e+04, - "cpu_time": 4.2978527220156764e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4378311433359573e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 36315, - "real_time": 1.9274829419246940e+04, - "cpu_time": 4.2994941869750277e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4401311533939751e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 36315, - "real_time": 1.9281489499857515e+04, - "cpu_time": 4.2997780173482060e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4382520603906082e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9280063066599723e+04, - "cpu_time": 4.2989555131488160e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4386545218847626e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time_median", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9280883573274412e+04, - "cpu_time": 4.2992932286933486e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 5.4384229644612885e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1073990117898886e+00, - "cpu_time": 8.1428202009170523e+00, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7669220429338831e+06, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6117162070766592e-04, - "cpu_time": 1.8941392103294309e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6119652402366076e-04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 26674, - "real_time": 2.6186057183759873e+04, - "cpu_time": 5.0779389480393082e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 8.0086589030311005e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 26674, - "real_time": 2.6290045239334417e+04, - "cpu_time": 5.0894681450101365e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 7.9769813285155594e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 26674, - "real_time": 2.6148578833698321e+04, - "cpu_time": 5.0764248969033761e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 8.0201375888824539e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 26674, - "real_time": 2.6244038067757894e+04, - "cpu_time": 5.0900268538652657e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 7.9909653940658447e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 26674, - "real_time": 2.6288425652262813e+04, - "cpu_time": 5.0885634363049474e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 7.9774727773379791e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6231428995362669e+04, - "cpu_time": 5.0844844560246078e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 7.9948431983665878e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time_median", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6244038067757891e+04, - "cpu_time": 5.0885634363049474e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 7.9909653940658447e+10, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.2781809142398856e+01, - "cpu_time": 6.7080842621425205e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9147422636238852e+08, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3933812051755840e-03, - "cpu_time": 1.3193243720499744e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3949716287307334e-03, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19026, - "real_time": 3.6744757588074812e+04, - "cpu_time": 6.2587861295069488e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1414700423445505e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19026, - "real_time": 3.6794980305788296e+04, - "cpu_time": 6.2623148270788006e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1399120111338081e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19026, - "real_time": 3.6743623295308578e+04, - "cpu_time": 6.2664120676968269e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1415052800564522e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19026, - "real_time": 3.6788420855232340e+04, - "cpu_time": 6.2645821927887278e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1401152597729547e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19026, - "real_time": 3.6749350465953146e+04, - "cpu_time": 6.2604313360663749e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1413273831562982e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6764226502071440e+04, - "cpu_time": 6.2625053106275365e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1408659952928128e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time_median", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6749350465953146e+04, - "cpu_time": 6.2623148270788006e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 1.1413273831562982e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5278401643746836e+01, - "cpu_time": 3.0718948962904371e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8423947334830835e+07, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.8758149018374021e-04, - "cpu_time": 4.9052172316363548e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8740717716547133e-04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10850, - "real_time": 6.4472362432899252e+04, - "cpu_time": 9.2122898156681782e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.3011168946586363e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10850, - "real_time": 6.4518386955439521e+04, - "cpu_time": 9.2221278064516388e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.3001887362425388e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10850, - "real_time": 6.4475562480199987e+04, - "cpu_time": 9.2170800921655304e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.3010523177019333e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10850, - "real_time": 6.4507238986668039e+04, - "cpu_time": 9.2217466359448517e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.3004134313877094e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10850, - "real_time": 6.4463573769496732e+04, - "cpu_time": 9.2178149216590711e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.3012942828759787e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4487424924940708e+04, - "cpu_time": 9.2182118543778561e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.3008131325733592e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time_median", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4475562480199987e+04, - "cpu_time": 9.2178149216590711e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 1.3010523177019333e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3915048863435985e+01, - "cpu_time": 4.0105593455866497e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8234281396261729e+07, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.7084825283800049e-04, - "cpu_time": 4.3506912283448776e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7080100276079862e-04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5812, - "real_time": 1.2048575350310592e+05, - "cpu_time": 1.5413840020646711e+05, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.3924647115700290e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5812, - "real_time": 1.2045470331517895e+05, - "cpu_time": 1.5417537577425479e+05, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.3928236538926279e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5812, - "real_time": 1.2048030386343208e+05, - "cpu_time": 1.5418375705436885e+05, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.3925276963957080e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5812, - "real_time": 1.2047168761733940e+05, - "cpu_time": 1.5411403750860205e+05, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.3926272912595331e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5812, - "real_time": 1.2048974828801409e+05, - "cpu_time": 1.5421289108741039e+05, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.3924185450115128e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2047643931741412e+05, - "cpu_time": 1.5416489232622067e+05, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.3925723796258823e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time_median", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2048030386343210e+05, - "cpu_time": 1.5417537577425479e+05, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.3925276963957080e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3909078874616574e+01, - "cpu_time": 3.8915635076111350e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6078567444247015e+07, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1545061385795874e-04, - "cpu_time": 2.5242864629492889e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1545947398846556e-04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3051, - "real_time": 2.2935484691498749e+05, - "cpu_time": 2.7449511373320542e+05, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.4629920601781424e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3051, - "real_time": 2.2940387679123535e+05, - "cpu_time": 2.7457263389052887e+05, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.4626793788029825e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3051, - "real_time": 2.2939837064890278e+05, - "cpu_time": 2.7458143788921152e+05, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.4627144868154056e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3051, - "real_time": 2.2941357902196542e+05, - "cpu_time": 2.7454684627992066e+05, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.4626175199850439e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3051, - "real_time": 2.2937613453545709e+05, - "cpu_time": 2.7451998525072931e+05, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.4628562848509045e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2938936158250962e+05, - "cpu_time": 2.7454320340871916e+05, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.4627719461264960e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time_median", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2939837064890278e+05, - "cpu_time": 2.7454684627992060e+05, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 1.4627144868154056e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3688372522091875e+01, - "cpu_time": 3.6031232774985085e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5106366990124395e+07, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0326709294045158e-04, - "cpu_time": 1.3124066568621080e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0327219516430378e-04, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1560, - "real_time": 4.4872205966011959e+05, - "cpu_time": 5.1778271089743520e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.4955552675709991e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1560, - "real_time": 4.4873980786621524e+05, - "cpu_time": 5.1768272820512409e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.4954961165381491e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1560, - "real_time": 4.4870903793474636e+05, - "cpu_time": 5.1773759999998118e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.4955986692151123e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1560, - "real_time": 4.4868585706960101e+05, - "cpu_time": 5.1775606410255173e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.4956759376881796e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1560, - "real_time": 4.4866667413794529e+05, - "cpu_time": 5.1775746410254005e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.4957398859396222e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4870468733372557e+05, - "cpu_time": 5.1774331346152647e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.4956131753904126e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time_median", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4870903793474630e+05, - "cpu_time": 5.1775606410255173e+05, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 1.4955986692151123e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8955824735049656e+01, - "cpu_time": 3.7477307437209639e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6515786281167492e+06, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.4532030871149941e-05, - "cpu_time": 7.2385884013921858e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4532586279184893e-05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 788, - "real_time": 8.8868429020063742e+05, - "cpu_time": 1.0051852753807299e+06, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.5102970703994080e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 788, - "real_time": 8.8885527025544224e+05, - "cpu_time": 1.0051963870558565e+06, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.5100065499012912e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 788, - "real_time": 8.8874420087883796e+05, - "cpu_time": 1.0052077918781929e+06, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.5101952605404153e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 788, - "real_time": 8.8877609239827341e+05, - "cpu_time": 1.0052341878172269e+06, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.5101410709397781e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 788, - "real_time": 8.8866338522946415e+05, - "cpu_time": 1.0051310253806731e+06, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.5103325987189545e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8874464779253094e+05, - "cpu_time": 1.0051909335025357e+06, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.5101945100999692e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time_median", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8874420087883808e+05, - "cpu_time": 1.0051963870558564e+06, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.5101952605404153e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6604397656691006e+01, - "cpu_time": 3.8098161876130753e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3016569263421142e+07, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.6193934159785299e-05, - "cpu_time": 3.7901418134940465e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6191342746700191e-05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 396, - "real_time": 1.7692914248486473e+06, - "cpu_time": 1.9817555707070865e+06, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.5171918669247104e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 396, - "real_time": 1.7691164843695748e+06, - "cpu_time": 1.9814497954544979e+06, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.5173418956392636e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 396, - "real_time": 1.7692001084938194e+06, - "cpu_time": 1.9816395202020153e+06, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.5172701760035968e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 396, - "real_time": 1.7690736523504846e+06, - "cpu_time": 1.9815099090908919e+06, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.5173786328417838e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 396, - "real_time": 1.7693071838378944e+06, - "cpu_time": 1.9817830984848540e+06, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.5171783534938403e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7691977707800840e+06, - "cpu_time": 1.9816275787878695e+06, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.5172721849806390e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time_median", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7692001084938194e+06, - "cpu_time": 1.9816395202020151e+06, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 1.5172701760035968e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0339322123828056e+02, - "cpu_time": 1.4676850112834961e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8670873398833741e+06, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.8440736782463778e-05, - "cpu_time": 7.4064623796831492e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8440979988020552e-05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 198, - "real_time": 3.5304365423272806e+06, - "cpu_time": 3.9470013888887358e+06, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.5206927119729282e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 198, - "real_time": 3.5303177693012087e+06, - "cpu_time": 3.9464299646464377e+06, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.5207438737342566e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 198, - "real_time": 3.5305626224726439e+06, - "cpu_time": 3.9472768535354203e+06, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.5206384064192020e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 198, - "real_time": 3.5303888684891239e+06, - "cpu_time": 3.9467672121211514e+06, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.5207132471776712e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 198, - "real_time": 3.5303751314811483e+06, - "cpu_time": 3.9474483383839191e+06, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.5207191644100409e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5304161868142812e+06, - "cpu_time": 3.9469847515151338e+06, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.5207014807428198e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time_median", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5303888684891239e+06, - "cpu_time": 3.9470013888887363e+06, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 1.5207132471776712e+11, - "own_gpu": 1.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2162321938911788e+01, - "cpu_time": 4.0485337216668364e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9697569271682114e+06, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_implicit_mapped_GPUWrGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6105228693185799e-05, - "cpu_time": 1.0257282397943699e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6104774523064824e-05, - "own_gpu": 0.0000000000000000e+00, - "wr_gpu": NaN - } \ No newline at end of file diff --git a/results/implicit_mapped_HostWrGPU.json b/results/implicit_mapped_HostWrGPU.json deleted file mode 100644 index 098fda7..0000000 --- a/results/implicit_mapped_HostWrGPU.json +++ /dev/null @@ -1,38 +0,0 @@ -{ - "context": { - "date": "2023-10-09T16:41:39-04:00", - "host_name": "frontier06647", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1798, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [1.31,5.45,4.52], - "library_build_type": "release" - }, - "benchmarks": [ diff --git a/results/prefetch_managed_GPUToGPU.json b/results/prefetch_managed_GPUToGPU.json deleted file mode 100644 index eaa1899..0000000 --- a/results/prefetch_managed_GPUToGPU.json +++ /dev/null @@ -1,27928 +0,0 @@ -{ - "context": { - "date": "2023-10-09T16:09:31-04:00", - "host_name": "frontier07514", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1796, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [0.81,11.68,31.57], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 79043, - "real_time": 8.9134698092958333e+03, - "cpu_time": 2.1045625887175331e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1488230979725461e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 79043, - "real_time": 8.9102897982250197e+03, - "cpu_time": 2.1000491403413336e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1492331037358478e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 79043, - "real_time": 8.9054022328977499e+03, - "cpu_time": 2.0981241046012925e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1498638390719812e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 79043, - "real_time": 8.9602867057645126e+03, - "cpu_time": 2.1085640094632028e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1428205744144544e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 79043, - "real_time": 9.0213297776129184e+03, - "cpu_time": 2.1216919841099145e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1350876480994299e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9421556647592079e+03, - "cpu_time": 2.1065983654466552e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1451656526588519e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9134698092958351e+03, - "cpu_time": 2.1045625887175331e+04, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.1488230979725461e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9463120861198988e+01, - "cpu_time": 9.3612354153091957e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3059414033909317e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.5314537920796662e-03, - "cpu_time": 4.4437684794862934e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5065757419022849e-03, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 75911, - "real_time": 9.3211313289398695e+03, - "cpu_time": 2.1601203093095868e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.1971581857681298e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 75911, - "real_time": 9.2110138695324949e+03, - "cpu_time": 2.1507746637509732e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.2234251614517936e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 75911, - "real_time": 8.9384880996791271e+03, - "cpu_time": 2.1194600281909101e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.2912152224865845e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 75911, - "real_time": 8.9211151927016872e+03, - "cpu_time": 2.1168430003556779e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.2956771163267311e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 75911, - "real_time": 8.9306596332770096e+03, - "cpu_time": 2.1192519911475305e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.2932236633101967e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0644816248260377e+03, - "cpu_time": 2.1332899985509361e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.2601398698686874e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9384880996791289e+03, - "cpu_time": 2.1194600281909101e+04, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.2912152224865845e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8820029026386112e+02, - "cpu_time": 2.0520822194879480e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6469810524952644e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0762388634382938e-02, - "cpu_time": 9.6193308030406120e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0560590583118429e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 77064, - "real_time": 9.1130991840211154e+03, - "cpu_time": 2.1471712394892576e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.4946290140042764e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 77064, - "real_time": 9.0926277494848564e+03, - "cpu_time": 2.1411010264195993e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.5047483663147426e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 77064, - "real_time": 8.8304681139009263e+03, - "cpu_time": 2.1052866487594696e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.6384856920009434e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 77064, - "real_time": 8.8879375324511584e+03, - "cpu_time": 2.1020667237620681e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.6084932359671813e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 77064, - "real_time": 8.9279207438885223e+03, - "cpu_time": 2.1077142271358858e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.5878543476137567e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9704106647493154e+03, - "cpu_time": 2.1206679731132561e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.5668421311801797e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9279207438885205e+03, - "cpu_time": 2.1077142271358858e+04, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 4.5878543476137567e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2598428254840817e+02, - "cpu_time": 2.1623621037878326e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3991205458156513e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4044427535908011e-02, - "cpu_time": 1.0196608479984571e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4012134341420660e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 75917, - "real_time": 9.2591456870714337e+03, - "cpu_time": 2.1481177917989371e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 8.8474685212465215e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 75917, - "real_time": 9.2640701804632154e+03, - "cpu_time": 2.1497017242514834e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 8.8427654804212534e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 75917, - "real_time": 9.1425555907851322e+03, - "cpu_time": 2.1389614565907483e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 8.9602955307778430e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 75917, - "real_time": 8.9496936989932474e+03, - "cpu_time": 2.1144024171134250e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.1533858872974837e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 75917, - "real_time": 8.9375545592537910e+03, - "cpu_time": 2.1152064992030831e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 9.1658181728447676e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1106039433133665e+03, - "cpu_time": 2.1332779777915355e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 8.9939467185175753e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1425555907851340e+03, - "cpu_time": 2.1389614565907483e+04, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 8.9602955307778430e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6005908238070361e+02, - "cpu_time": 1.7357466607377256e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5843348511134885e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7568438204162890e-02, - "cpu_time": 8.1365235979918953e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7615568567373348e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 76993, - "real_time": 9.1370141230202389e+03, - "cpu_time": 2.1480745756107739e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.7931459642512045e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 76993, - "real_time": 9.1480151724087591e+03, - "cpu_time": 2.1475195784032319e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.7909895962367470e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 76993, - "real_time": 9.0935004719521730e+03, - "cpu_time": 2.1413125998467334e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.8017264144357295e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 76993, - "real_time": 8.9264805996291234e+03, - "cpu_time": 2.1125912563479778e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.8354378096873610e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 76993, - "real_time": 8.8845060499330139e+03, - "cpu_time": 2.1047713519410790e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.8441092738209720e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0379032833886631e+03, - "cpu_time": 2.1308538724299593e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.8130818116864030e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0935004719521712e+03, - "cpu_time": 2.1413125998467334e+04, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.8017264144357295e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2347505790661239e+02, - "cpu_time": 2.0600390615359498e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4884448438139029e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3661914056278411e-02, - "cpu_time": 9.6676693235033789e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3724945161185661e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 76438, - "real_time": 9.0888815704584613e+03, - "cpu_time": 2.1425251458698564e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6052840765915184e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 76438, - "real_time": 9.0211171532364133e+03, - "cpu_time": 2.1345552931787930e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6323660854181633e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 76438, - "real_time": 8.8624902854353550e+03, - "cpu_time": 2.1106619574033884e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6973806395986733e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 76438, - "real_time": 8.8455823385196927e+03, - "cpu_time": 2.1008789829665919e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.7044480222976165e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 76438, - "real_time": 8.8934221334089852e+03, - "cpu_time": 2.1084854103979738e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6845209311389694e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9422986962117830e+03, - "cpu_time": 2.1194213579633208e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6647999510089884e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8934221334089852e+03, - "cpu_time": 2.1106619574033884e+04, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.6845209311389694e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0701780559487399e+02, - "cpu_time": 1.8048287512784233e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3636231585723348e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1967594600727197e-02, - "cpu_time": 8.5156674697889796e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1906852261802032e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 75351, - "real_time": 9.2260434635517558e+03, - "cpu_time": 2.1610926610131235e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.1033699612304401e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 75351, - "real_time": 9.1675534559580828e+03, - "cpu_time": 2.1502981340659102e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.1486902492406530e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 75351, - "real_time": 9.0436760740528971e+03, - "cpu_time": 2.1357186102374206e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.2466107214994745e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 75351, - "real_time": 8.9627489409785085e+03, - "cpu_time": 2.1193276691749332e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.3120423690954237e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 75351, - "real_time": 8.9407943439522205e+03, - "cpu_time": 2.1150312816021011e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.3299974788403683e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0681632556986933e+03, - "cpu_time": 2.1362936712186976e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.2281421559812717e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0436760740528971e+03, - "cpu_time": 2.1357186102374202e+04, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.2466107214994745e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2523898298015322e+02, - "cpu_time": 1.9693780789577244e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9543390708928540e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3810843436398153e-02, - "cpu_time": 9.2186673840317455e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3771642638012675e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 76097, - "real_time": 9.1860158183993317e+03, - "cpu_time": 2.1534922335965945e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4268645144009710e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 76097, - "real_time": 9.2413267897695659e+03, - "cpu_time": 2.1602049502608523e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4183244785272690e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 76097, - "real_time": 8.9935332377289506e+03, - "cpu_time": 2.1261194094379611e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4574027418961132e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 76097, - "real_time": 8.9239130027200245e+03, - "cpu_time": 2.1107404168364032e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4687727229080900e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 76097, - "real_time": 8.8751261818576786e+03, - "cpu_time": 2.1065765444104200e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4768466083100233e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0439830060951099e+03, - "cpu_time": 2.1314267109084460e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4496422132084934e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9935332377289487e+03, - "cpu_time": 2.1261194094379607e+04, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4574027418961132e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6170381926229800e+02, - "cpu_time": 2.4437140473251984e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5816203188343990e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7879712860287240e-02, - "cpu_time": 1.1465156342549779e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7808672342125704e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 76462, - "real_time": 9.2155771671799594e+03, - "cpu_time": 2.1553928055766100e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.8445749543890820e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 76462, - "real_time": 9.2112396125229097e+03, - "cpu_time": 2.1550738785278929e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.8459144591528011e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 76462, - "real_time": 9.0936856963223418e+03, - "cpu_time": 2.1401143849232303e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.8827035456703323e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 76462, - "real_time": 9.1218200373881191e+03, - "cpu_time": 2.1431248934111092e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.8738124510847130e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 76462, - "real_time": 9.0471987313963837e+03, - "cpu_time": 2.1357323533258259e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.8975156596293709e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1379042489619442e+03, - "cpu_time": 2.1458876631529340e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.8689042139852600e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1218200373881209e+03, - "cpu_time": 2.1431248934111096e+04, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.8738124510847130e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3913177020927819e+01, - "cpu_time": 8.9278810651181587e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3203280306753871e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.0886355347096432e-03, - "cpu_time": 4.1604605955935740e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0878546567163586e-03, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 73903, - "real_time": 9.4377874698665219e+03, - "cpu_time": 2.1837400714449992e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 5.5552003228932098e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 73903, - "real_time": 9.4575323164702295e+03, - "cpu_time": 2.1881848098182712e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 5.5436025218434204e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 73903, - "real_time": 9.1913992827472393e+03, - "cpu_time": 2.1569630650988427e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 5.7041151610518913e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 73903, - "real_time": 9.1600937573789615e+03, - "cpu_time": 2.1463518503985055e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 5.7236095381409935e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 73903, - "real_time": 9.1313316892192906e+03, - "cpu_time": 2.1427902602059447e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 5.7416378885786102e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2756289031364468e+03, - "cpu_time": 2.1636060113933127e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 5.6536330865016266e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1913992827472375e+03, - "cpu_time": 2.1569630650988423e+04, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 5.7041151610518913e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5862608340587207e+02, - "cpu_time": 2.1122428901388986e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6158362785113621e+08, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7101383104301905e-02, - "cpu_time": 9.7626040925014000e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7008242543135179e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 74610, - "real_time": 9.3935084101492084e+03, - "cpu_time": 2.1800549765447027e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.1162772781116234e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 74610, - "real_time": 9.3386104167535013e+03, - "cpu_time": 2.1753407612920601e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.1228394302848857e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 74610, - "real_time": 8.9188169825446475e+03, - "cpu_time": 2.1293061064200476e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.1756895584383080e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 74610, - "real_time": 8.9626259552551583e+03, - "cpu_time": 2.1230890885940138e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.1699428328649335e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 74610, - "real_time": 8.8653477039657100e+03, - "cpu_time": 2.1087615024795581e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.1827804560118309e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0957818937336451e+03, - "cpu_time": 2.1433104870660765e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.1535059111423163e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9626259552551583e+03, - "cpu_time": 2.1293061064200476e+04, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.1699428328649335e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4987685453399240e+02, - "cpu_time": 3.2306175661317309e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1407362774911757e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7471728923726717e-02, - "cpu_time": 1.5073026449630458e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7227743240439108e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 76700, - "real_time": 9.3139363590888333e+03, - "cpu_time": 2.1741541408083369e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2516280111292935e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 76700, - "real_time": 9.2581521958728790e+03, - "cpu_time": 2.1686834263363820e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2651949931595132e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 76700, - "real_time": 9.2698756723898514e+03, - "cpu_time": 2.1631409739243805e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2623302341004715e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 76700, - "real_time": 8.8901922587344998e+03, - "cpu_time": 2.1139503441981673e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.3589501092505341e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 76700, - "real_time": 8.8678418709169091e+03, - "cpu_time": 2.1113472920469510e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.3648955749626605e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1199996714005956e+03, - "cpu_time": 2.1462552354628435e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.3005997845204947e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2581521958728790e+03, - "cpu_time": 2.1631409739243805e+04, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.2651949931595132e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2110821885621493e+02, - "cpu_time": 3.0938129152709217e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6247225252515287e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4244323116544418e-02, - "cpu_time": 1.4414934739128247e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4448939633469835e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 75086, - "real_time": 9.2435394845660685e+03, - "cpu_time": 2.1672367844871093e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 4.5375518836731604e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 75086, - "real_time": 9.2052987365141398e+03, - "cpu_time": 2.1608552007032053e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 4.5564018290494916e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 75086, - "real_time": 8.8818262535789363e+03, - "cpu_time": 2.1201390072716615e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 4.7223441218633417e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 75086, - "real_time": 9.0394178814079060e+03, - "cpu_time": 2.1378716897957103e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 4.6400156016979370e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 75086, - "real_time": 8.9872835383634156e+03, - "cpu_time": 2.1331208187944507e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 4.6669318733475525e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0714731788860954e+03, - "cpu_time": 2.1438447002104276e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 4.6246490619262970e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time_median", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0394178814079078e+03, - "cpu_time": 2.1378716897957107e+04, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 4.6400156016979370e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5132538400006783e+02, - "cpu_time": 1.9679844369098726e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7155516130289545e+09, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6681456365023328e-02, - "cpu_time": 9.1796968162698826e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6683539679906455e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 74801, - "real_time": 9.3497294695090968e+03, - "cpu_time": 2.1751469873397553e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 8.9720328565190454e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 74801, - "real_time": 9.3546087399650714e+03, - "cpu_time": 2.1732284073742470e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 8.9673531338215234e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 74801, - "real_time": 8.9671217409553210e+03, - "cpu_time": 2.1299687972085885e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 9.3548501317729529e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 74801, - "real_time": 8.9858838412582354e+03, - "cpu_time": 2.1237046643761616e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 9.3353176473126965e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 74801, - "real_time": 8.9750136691855605e+03, - "cpu_time": 2.1206318324621319e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 9.3466242049314075e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1264714921746599e+03, - "cpu_time": 2.1445361377521771e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 9.1952355948715259e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time_median", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9858838412582354e+03, - "cpu_time": 2.1299687972085885e+04, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 9.3353176473126965e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0614766019851950e+02, - "cpu_time": 2.7284812412150524e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0601466666506802e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2587881896664816e-02, - "cpu_time": 1.2722943638874487e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2404501172321123e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 74651, - "real_time": 9.3676361840978334e+03, - "cpu_time": 2.1803767143105819e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.7909764715756580e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 74651, - "real_time": 9.4387242169704841e+03, - "cpu_time": 2.1889196179555413e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.7774876788788018e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 74651, - "real_time": 8.9434136146422061e+03, - "cpu_time": 2.1295656119810756e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.8759297873165845e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 74651, - "real_time": 9.0868441855465462e+03, - "cpu_time": 2.1470584466383549e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.8463193224646345e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 74651, - "real_time": 9.0828666981214483e+03, - "cpu_time": 2.1454558920845138e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.8471278460433560e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1838969798757043e+03, - "cpu_time": 2.1582752565940136e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.8275682212558071e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time_median", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0868441855465462e+03, - "cpu_time": 2.1470584466383552e+04, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 1.8463193224646345e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0985448982919192e+02, - "cpu_time": 2.5208867201159123e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1593390880203926e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2850266100440525e-02, - "cpu_time": 1.1680098321166585e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2758871814712981e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 76838, - "real_time": 9.2629069428103630e+03, - "cpu_time": 2.1691464301517517e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6224515918346899e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 76838, - "real_time": 9.2265503709535005e+03, - "cpu_time": 2.1628740375855465e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6367256071818726e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 76838, - "real_time": 8.9135045687898000e+03, - "cpu_time": 2.1253445560790205e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.7644488473691030e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 76838, - "real_time": 9.0536022086682970e+03, - "cpu_time": 2.1363284117233627e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.7061968514447856e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 76838, - "real_time": 9.0239508617382508e+03, - "cpu_time": 2.1346872393867357e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.7183748575439971e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0961029905920423e+03, - "cpu_time": 2.1456761349852834e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.6896395510748901e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time_median", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0536022086682970e+03, - "cpu_time": 2.1363284117233627e+04, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.7061968514447856e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4594049071936314e+02, - "cpu_time": 1.9158101853548393e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9182768122601944e+10, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6044287413006109e-02, - "cpu_time": 8.9287015599303354e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6040257402748306e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 76644, - "real_time": 9.2207878371688275e+03, - "cpu_time": 2.1730249438964700e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2779967596136846e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 76644, - "real_time": 9.2324129939138911e+03, - "cpu_time": 2.1770814871352934e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2688325407711826e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 76644, - "real_time": 8.9685642486665874e+03, - "cpu_time": 2.1470359728093514e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.4826763949399697e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 76644, - "real_time": 8.8198585309909267e+03, - "cpu_time": 2.1180358893064022e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.6088367817006465e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 76644, - "real_time": 8.7990412468577415e+03, - "cpu_time": 2.1144737591983951e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.6268382108068301e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0081329715195952e+03, - "cpu_time": 2.1459304104691822e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.4530361375664629e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time_median", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9685642486665874e+03, - "cpu_time": 2.1470359728093514e+04, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.4826763949399697e+12, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0991421964467023e+02, - "cpu_time": 2.9467570341227827e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7315404640007593e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3302744343177639e-02, - "cpu_time": 1.3731838738789805e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3232685740956775e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 77890, - "real_time": 9.1046186068304687e+03, - "cpu_time": 2.1653455681088501e+04, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.4741718878735586e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 77890, - "real_time": 9.1538740351458237e+03, - "cpu_time": 2.1730257388625123e+04, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.4662396214398189e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 77890, - "real_time": 8.9232244754090480e+03, - "cpu_time": 2.1501390345358777e+04, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.5041393205996574e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 77890, - "real_time": 9.0576972795270049e+03, - "cpu_time": 2.1602925972525492e+04, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.4818084978769449e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 77890, - "real_time": 9.0106929205533797e+03, - "cpu_time": 2.1544804442162214e+04, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.4895383649558129e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0500214634931453e+03, - "cpu_time": 2.1606566765952022e+04, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.4831795385491586e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time_median", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0576972795270049e+03, - "cpu_time": 2.1602925972525496e+04, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 1.4818084978769449e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8669799436134184e+01, - "cpu_time": 8.9983137260652626e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4575025315289706e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.7977446566087176e-03, - "cpu_time": 4.1646198692912896e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.8268786323380299e-03, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 77035, - "real_time": 9.1619056646224908e+03, - "cpu_time": 2.2018206659310705e+04, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.9299085346024539e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 77035, - "real_time": 9.2108668614352191e+03, - "cpu_time": 2.2105798338417637e+04, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.9143343404941246e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 77035, - "real_time": 9.0754073760363281e+03, - "cpu_time": 2.1958942999934879e+04, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.9578336803789719e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 77035, - "real_time": 8.9096478432512140e+03, - "cpu_time": 2.1652801648601002e+04, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0128626935949172e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 77035, - "real_time": 8.9313721281891085e+03, - "cpu_time": 2.1683286908548027e+04, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.0055343361269949e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0578399747068725e+03, - "cpu_time": 2.1883807310962449e+04, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.9640947170394926e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time_median", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0754073760363281e+03, - "cpu_time": 2.1958942999934883e+04, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 2.9578336803789719e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3463889992966182e+02, - "cpu_time": 2.0405919526691696e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4100873832178345e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4864349591693792e-02, - "cpu_time": 9.3246660586659320e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4878361875097515e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 77297, - "real_time": 9.1514634663733214e+03, - "cpu_time": 2.2568332043934461e+04, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.8665033627977672e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 77297, - "real_time": 9.1277797080426262e+03, - "cpu_time": 2.2558299778775217e+04, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.8817251201511234e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 77297, - "real_time": 9.1799152462833717e+03, - "cpu_time": 2.2595089460134528e+04, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.8483210094707609e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 77297, - "real_time": 9.1643681776414251e+03, - "cpu_time": 2.2490806163240526e+04, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.8582425061208211e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 77297, - "real_time": 8.8510990455429292e+03, - "cpu_time": 2.2141466926271143e+04, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.0655847283772891e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0949251287767365e+03, - "cpu_time": 2.2470798874471177e+04, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.9040753453835531e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time_median", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1514634663733214e+03, - "cpu_time": 2.2558299778775217e+04, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.8665033627977672e+13, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3763431891379730e+02, - "cpu_time": 1.8806720925841410e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1112104528317029e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5133089823721182e-02, - "cpu_time": 8.3694046797808848e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5432070086903340e-02, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 75451, - "real_time": 9.2973971285494445e+03, - "cpu_time": 2.3870499635524877e+04, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1548843285427375e+14, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 75451, - "real_time": 9.1837771971508446e+03, - "cpu_time": 2.3788531709321283e+04, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1691723361201700e+14, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 75451, - "real_time": 9.2498578986970733e+03, - "cpu_time": 2.3929418417250828e+04, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1608198047574833e+14, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 75451, - "real_time": 9.3917561042221423e+03, - "cpu_time": 2.3966345363215911e+04, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1432812054364258e+14, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 75451, - "real_time": 9.2892787148443404e+03, - "cpu_time": 2.3868473287298748e+04, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1558936457403867e+14, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2824134086927697e+03, - "cpu_time": 2.3884653682522330e+04, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1568102641194406e+14, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time_median", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2892787148443422e+03, - "cpu_time": 2.3870499635524880e+04, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 1.1558936457403867e+14, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5855838294168109e+01, - "cpu_time": 6.7784563394158553e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4403666007687622e+11, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.1719952510551658e-03, - "cpu_time": 2.8379964932780301e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1606871010560505e-03, - "dst_gpu": NaN, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2247, - "real_time": 2.6711041202999133e+05, - "cpu_time": 5.3776339296839596e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8336206822406636e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2247, - "real_time": 2.5931789156521577e+05, - "cpu_time": 5.2212118024032190e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9488212472315072e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2247, - "real_time": 2.5944328429836413e+05, - "cpu_time": 5.2116067868268455e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9469127241789871e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2247, - "real_time": 2.5998722875020772e+05, - "cpu_time": 5.2176541700044408e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9386550059497179e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2247, - "real_time": 2.6009845733424978e+05, - "cpu_time": 5.2193842100578698e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9369706783153596e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6119145479560579e+05, - "cpu_time": 5.2494981797952659e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9209960675832476e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time_median", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5998722875020769e+05, - "cpu_time": 5.2193842100578698e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9386550059497179e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3258531923083146e+03, - "cpu_time": 7.1720881442414347e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9110584316362307e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2733392043437819e-02, - "cpu_time": 1.3662426195033278e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2525027689362667e-02, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2692, - "real_time": 2.5916551824243611e+05, - "cpu_time": 5.2106060326894734e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.9022858206167705e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2692, - "real_time": 2.5975309490253194e+05, - "cpu_time": 5.2103388112926978e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8844103889059657e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2692, - "real_time": 2.5978780594485902e+05, - "cpu_time": 5.2110761552748649e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8833569287493667e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2692, - "real_time": 2.5878965417525131e+05, - "cpu_time": 5.2080366158989840e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.9137630386611298e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2692, - "real_time": 2.5951939963077972e+05, - "cpu_time": 5.2141170728082437e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8915102412910387e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5940309457917162e+05, - "cpu_time": 5.2108349375928531e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8950652836448550e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time_median", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5951939963077972e+05, - "cpu_time": 5.2106060326894728e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8915102412910387e+06, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2331476799090996e+02, - "cpu_time": 2.1771392128911967e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2893727924650879e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6318801773650827e-03, - "cpu_time": 4.1781005135751374e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6331375943605027e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2692, - "real_time": 2.5986799047898327e+05, - "cpu_time": 5.2142785921247595e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5761848900475731e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2692, - "real_time": 2.5931202889259913e+05, - "cpu_time": 5.2095143090639089e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5795642097638540e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2692, - "real_time": 2.6019660666128993e+05, - "cpu_time": 5.2182098811291397e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5741942420225158e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2692, - "real_time": 2.5947719614677416e+05, - "cpu_time": 5.2175012407130818e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5785587561548503e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2692, - "real_time": 2.6031108654595781e+05, - "cpu_time": 5.2189050965824223e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5735019412155744e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5983298174512089e+05, - "cpu_time": 5.2156818239226623e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5764008078408737e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time_median", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5986799047898324e+05, - "cpu_time": 5.2175012407130812e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5761848900475731e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3589223385833884e+02, - "cpu_time": 3.8761493886160065e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6449401489270509e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6775862360919236e-03, - "cpu_time": 7.4317213347588611e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6778348093780212e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2670, - "real_time": 2.6172836229845198e+05, - "cpu_time": 5.2511065018725849e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1299626559610549e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2670, - "real_time": 2.6159490809003275e+05, - "cpu_time": 5.2484708913856826e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1315594251477446e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2670, - "real_time": 2.6120317447799770e+05, - "cpu_time": 5.2493844756555033e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1362559112734091e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2670, - "real_time": 2.6200881026413164e+05, - "cpu_time": 5.2505727977527666e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1266124187738676e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2670, - "real_time": 2.6112988726140003e+05, - "cpu_time": 5.2388495917604445e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1371361148712654e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6153302847840282e+05, - "cpu_time": 5.2476768516853976e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1323053052054688e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time_median", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6159490809003272e+05, - "cpu_time": 5.2493844756555033e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1315594251477446e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6731430600674253e+02, - "cpu_time": 5.0402381004659617e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3987870142659784e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4044662280086548e-03, - "cpu_time": 9.6047036487149321e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4043289480612851e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2660, - "real_time": 2.6357245654055040e+05, - "cpu_time": 5.2972055751880340e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.2161275176639475e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2660, - "real_time": 2.6457365907516849e+05, - "cpu_time": 5.3105523195488914e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1926043799186803e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2660, - "real_time": 2.6383729915474227e+05, - "cpu_time": 5.3022918458646361e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.2098877044639088e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2660, - "real_time": 2.6446027402009786e+05, - "cpu_time": 5.3044936729323887e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1952594054844260e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2660, - "real_time": 2.6452300750170799e+05, - "cpu_time": 5.3029965037593769e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1937901563795768e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6419333925845340e+05, - "cpu_time": 5.3035079834586661e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.2015338327821076e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time_median", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6446027402009780e+05, - "cpu_time": 5.3029965037593769e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1952594054844260e+07, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5739435540945016e+02, - "cpu_time": 4.7972702343703639e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0745125651894444e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7312864763861183e-03, - "cpu_time": 9.0454662260013041e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7326561366309613e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2619, - "real_time": 2.6782412269003701e+05, - "cpu_time": 5.3800688316151325e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2234894926893364e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2619, - "real_time": 2.6858960523786762e+05, - "cpu_time": 5.3874213096600294e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2200025377370837e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2619, - "real_time": 2.6780621497758495e+05, - "cpu_time": 5.3830840473464387e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2235713051970300e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2619, - "real_time": 2.6875693798333663e+05, - "cpu_time": 5.3873770141274482e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2192429429312693e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2619, - "real_time": 2.6768722281661123e+05, - "cpu_time": 5.3767468881252082e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2241152063671303e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6813282074108755e+05, - "cpu_time": 5.3829396181748505e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2220842969843701e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time_median", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6782412269003701e+05, - "cpu_time": 5.3830840473464399e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2234894926893364e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9967432653272238e+02, - "cpu_time": 4.6472632306254326e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2758172011389668e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8635328758026767e-03, - "cpu_time": 8.6333185216020336e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8622424056628506e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2541, - "real_time": 2.7705251063494728e+05, - "cpu_time": 5.5600269382132520e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3654721572385320e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2541, - "real_time": 2.7640414580835460e+05, - "cpu_time": 5.5538191774891224e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3710208762729457e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2541, - "real_time": 2.7725922978235374e+05, - "cpu_time": 5.5636023770168982e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3637085067085135e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2541, - "real_time": 2.7593237237304018e+05, - "cpu_time": 5.5574331680439378e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3750747125603721e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2541, - "real_time": 2.7690654783537163e+05, - "cpu_time": 5.5690908933491632e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3667190433850959e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7671096128681349e+05, - "cpu_time": 5.5607945108224754e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3683990592330921e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time_median", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7690654783537163e+05, - "cpu_time": 5.5600269382132520e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3667190433850959e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3755112148568844e+02, - "cpu_time": 5.8578396976530553e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6051265850137064e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9426448413386549e-03, - "cpu_time": 1.0534177600435455e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9444048362799492e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2365, - "real_time": 2.9254838890478760e+05, - "cpu_time": 5.8854563340381102e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4803528226798248e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2365, - "real_time": 2.9285769936939736e+05, - "cpu_time": 5.8834698562368506e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4756207633343369e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2365, - "real_time": 2.9570861545048776e+05, - "cpu_time": 5.8902719154334115e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4324714652064693e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2365, - "real_time": 2.9255366338029050e+05, - "cpu_time": 5.8852728879492031e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4802720460081720e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2365, - "real_time": 2.9301784402714454e+05, - "cpu_time": 5.8843598224101949e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4731746776437879e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9333724222642160e+05, - "cpu_time": 5.8857661632135557e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4683783549745178e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time_median", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9285769936939736e+05, - "cpu_time": 5.8852728879492043e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4756207633343369e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3408647303442085e+03, - "cpu_time": 2.6406409190464836e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0307693653293080e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5710688495162848e-03, - "cpu_time": 4.4864862888211089e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5447569655074314e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2155, - "real_time": 3.2410593958638539e+05, - "cpu_time": 6.5156258004639752e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0882195597692704e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2155, - "real_time": 3.2463353007044340e+05, - "cpu_time": 6.5194110394431022e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0750746832317793e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2155, - "real_time": 3.2366767883292143e+05, - "cpu_time": 6.5152397772620292e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0991713768034232e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2155, - "real_time": 3.2434493088295247e+05, - "cpu_time": 6.5255680000001099e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0822598116879725e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2155, - "real_time": 3.2456930434512813e+05, - "cpu_time": 6.5253259860789857e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0766725778002512e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2426427674356615e+05, - "cpu_time": 6.5202341206496407e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0842796018585396e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time_median", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2434493088295247e+05, - "cpu_time": 6.5194110394431022e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0822598116879725e+08, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9271321267004430e+02, - "cpu_time": 5.0307779200613612e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7975140169330710e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2110899683859062e-03, - "cpu_time": 7.7156400015282304e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2119217171410878e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1795, - "real_time": 3.8920734476552327e+05, - "cpu_time": 7.8195216490251396e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3470660486015639e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1795, - "real_time": 3.8892513291500404e+05, - "cpu_time": 7.8110786350976327e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3480435066524184e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1795, - "real_time": 3.8994129743585287e+05, - "cpu_time": 7.8250780501393904e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3445305830584610e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1795, - "real_time": 3.8851350759905775e+05, - "cpu_time": 7.8017543064067303e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3494717422825365e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1795, - "real_time": 3.8887433192762744e+05, - "cpu_time": 7.8084613704735134e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3482196096644769e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8909232292861311e+05, - "cpu_time": 7.8131788022284827e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3474662980518913e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time_median", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8892513291500404e+05, - "cpu_time": 7.8110786350976327e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3480435066524184e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3490361276171620e+02, - "cpu_time": 9.2060818951771921e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8507482853375820e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3747472803770926e-03, - "cpu_time": 1.1782761060775196e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3735024675669543e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1299, - "real_time": 5.3515379048964218e+05, - "cpu_time": 1.0677217074673129e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9593918956279824e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1299, - "real_time": 5.3220911950211378e+05, - "cpu_time": 1.0669930100077088e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9702330560982344e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1299, - "real_time": 5.3488983344494598e+05, - "cpu_time": 1.0679922771362439e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9603588149108570e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1299, - "real_time": 5.3171273922258057e+05, - "cpu_time": 1.0675712748267897e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9720723666187265e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1299, - "real_time": 5.3550618468748673e+05, - "cpu_time": 1.0696057775211826e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9581025018636024e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3389433346935385e+05, - "cpu_time": 1.0679768093918476e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9640317270238805e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time_median", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3488983344494598e+05, - "cpu_time": 1.0677217074673127e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9603588149108570e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7870797484523177e+03, - "cpu_time": 9.8122027589705283e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5818385948730158e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.3472536350770202e-03, - "cpu_time": 9.1876552680558883e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3511875110319883e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 906, - "real_time": 7.6901509700739803e+05, - "cpu_time": 1.5421574713024138e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7270621970374985e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 906, - "real_time": 7.6848581532493362e+05, - "cpu_time": 1.5410280309050770e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7289404152674899e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 906, - "real_time": 7.6907725649306062e+05, - "cpu_time": 1.5414125121412983e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7268417864323134e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 906, - "real_time": 7.6865059568774910e+05, - "cpu_time": 1.5406958366445547e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7283553955013537e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 906, - "real_time": 7.6833746956751810e+05, - "cpu_time": 1.5403547649006736e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7294673018881211e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6871324681613198e+05, - "cpu_time": 1.5411297231788037e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7281334192253556e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time_median", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6865059568774910e+05, - "cpu_time": 1.5410280309050770e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7283553955013537e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2422036088586776e+02, - "cpu_time": 6.9559236908242042e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1506075873902449e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2177022736206052e-04, - "cpu_time": 4.5135225063835650e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2175634786841037e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 525, - "real_time": 1.3289535679810103e+06, - "cpu_time": 2.6812349047619523e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1560952173612232e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 525, - "real_time": 1.3323117431164496e+06, - "cpu_time": 2.6860283828570922e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1481400818317337e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 525, - "real_time": 1.3292446224728511e+06, - "cpu_time": 2.6789749295237795e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1554041514173331e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 525, - "real_time": 1.3272935327231176e+06, - "cpu_time": 2.6786843790475922e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1600425200557055e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 525, - "real_time": 1.3293195901704687e+06, - "cpu_time": 2.6804400152380890e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1552262006927414e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3294246112927797e+06, - "cpu_time": 2.6810725222857012e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1549816342717476e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time_median", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3292446224728511e+06, - "cpu_time": 2.6804400152380886e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1554041514173331e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8126178064045685e+03, - "cpu_time": 2.9618453180231363e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2981916393944090e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3634603955781401e-03, - "cpu_time": 1.1047240585264238e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3623507638536681e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 278, - "real_time": 2.5030083145289649e+06, - "cpu_time": 5.0350194784172997e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3514103614069023e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 278, - "real_time": 2.5164984190072729e+06, - "cpu_time": 5.0442161510791481e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3334445738730884e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 278, - "real_time": 2.5071930634393860e+06, - "cpu_time": 5.0427491510790968e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3458165317721667e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 278, - "real_time": 2.5163061561719547e+06, - "cpu_time": 5.0436719172661901e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3336992716186619e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 278, - "real_time": 2.5071004110810566e+06, - "cpu_time": 5.0408274496402610e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3459401797085776e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5100212728457274e+06, - "cpu_time": 5.0412968294963995e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3420621836758800e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time_median", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5071930634393860e+06, - "cpu_time": 5.0427491510790968e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3458165317721667e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.0655784362805134e+03, - "cpu_time": 3.7382540180824253e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0734736408661176e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4165446332666679e-03, - "cpu_time": 7.4152626685460596e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4157161647980572e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 142, - "real_time": 4.9193103266486395e+06, - "cpu_time": 9.8206041901407950e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4104813248140316e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 142, - "real_time": 4.9162635474767480e+06, - "cpu_time": 9.8224895704222620e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4125949184743838e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 142, - "real_time": 4.9199345357663613e+06, - "cpu_time": 9.8227137746479772e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4100486252479515e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 142, - "real_time": 4.9171052302535567e+06, - "cpu_time": 9.8191208450705577e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4120107694207025e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 142, - "real_time": 4.9175716818533316e+06, - "cpu_time": 9.8211514225351792e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4116871263739290e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9180370643997286e+06, - "cpu_time": 9.8212159605633561e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4113645528661995e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time_median", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9175716818533316e+06, - "cpu_time": 9.8211514225351792e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4116871263739290e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5371932543570690e+03, - "cpu_time": 1.4691380361985537e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0662089767395507e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1256235653130270e-04, - "cpu_time": 1.4958820191896915e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1254618502843124e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 71, - "real_time": 9.8263367249722220e+06, - "cpu_time": 1.9575984690140534e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4147447761205087e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 71, - "real_time": 9.9034027498162966e+06, - "cpu_time": 1.9676098056338657e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.3881720099308715e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 71, - "real_time": 9.8310735758761279e+06, - "cpu_time": 1.9560994619718909e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4130994688451090e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 71, - "real_time": 9.8363603530845176e+06, - "cpu_time": 1.9594643915492989e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4112650203464632e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 71, - "real_time": 9.7852166558445338e+06, - "cpu_time": 1.9475507718310144e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4290944370617018e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8364780119187422e+06, - "cpu_time": 1.9576645800000247e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4112751424609308e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time_median", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8310735758761279e+06, - "cpu_time": 1.9575984690140534e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4130994688451090e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2540318060303362e+04, - "cpu_time": 7.1918341768254584e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4719448186961358e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.3247509940811928e-03, - "cpu_time": 3.6736804916935096e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3149401828498036e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 33, - "real_time": 2.1273506805300713e+07, - "cpu_time": 4.1817427060607314e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1545745896148400e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 33, - "real_time": 2.1266510315013655e+07, - "cpu_time": 4.1811944060605057e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1556124162328000e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 33, - "real_time": 2.1266970952803437e+07, - "cpu_time": 4.1840820636363074e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1555440663802490e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 33, - "real_time": 2.1235106400016584e+07, - "cpu_time": 4.1814746909091644e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1602791498114462e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 33, - "real_time": 2.1261346836884815e+07, - "cpu_time": 4.1814329151515558e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1563787804626536e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1260688262003843e+07, - "cpu_time": 4.1819853563636526e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1564778005003986e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time_median", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1266510315013655e+07, - "cpu_time": 4.1814746909091644e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1556124162328000e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4937778786749910e+04, - "cpu_time": 1.1881322991789211e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2194043424306442e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.0260090372737576e-04, - "cpu_time": 2.8410723566283204e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0312686567249115e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 18, - "real_time": 3.8941751130753092e+07, - "cpu_time": 7.7106303222222999e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4466279533589215e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 18, - "real_time": 3.8933013669318624e+07, - "cpu_time": 7.6963980277775422e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4474014557411728e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 18, - "real_time": 3.8951047799653478e+07, - "cpu_time": 7.7112550500001162e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4458053269928737e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 18, - "real_time": 3.8905029495557152e+07, - "cpu_time": 7.7058177444443896e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4498811526496158e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 18, - "real_time": 3.8995626899931163e+07, - "cpu_time": 7.7170008722223178e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4418661442326221e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8945293799042709e+07, - "cpu_time": 7.7082204033333331e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4463164065950413e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time_median", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8941751130753092e+07, - "cpu_time": 7.7106303222223014e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4466279533589215e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2981418200132604e+04, - "cpu_time": 7.7080275824595796e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9175265600847579e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.4686530727734043e-04, - "cpu_time": 9.9997498503368292e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4656375558020002e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.4557808538277939e+07, - "cpu_time": 1.4575319166666153e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6003667659060202e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.4644654161400259e+07, - "cpu_time": 1.4579117300000158e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5961779047107100e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.4663338561852768e+07, - "cpu_time": 1.4567496066666761e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5952779660076690e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.4957542121410370e+07, - "cpu_time": 1.4590758011111248e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5811667298963623e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.4704599877198532e+07, - "cpu_time": 1.4573022188888749e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5932921994262943e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4705588652027994e+07, - "cpu_time": 1.4577142546666616e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5932563131894112e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time_median", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4663338561852783e+07, - "cpu_time": 1.4575319166666156e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5952779660076690e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5068059986270315e+05, - "cpu_time": 8.6982349067209769e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2343041647970537e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0169923372742571e-03, - "cpu_time": 5.9670370093966186e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0133003421556120e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4251177608966827e+08, - "cpu_time": 2.7247816459999967e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7672038531201892e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4231949150562286e+08, - "cpu_time": 2.7210350220000237e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7722936353998208e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4201087951660156e+08, - "cpu_time": 2.7177530860000163e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7804914231042271e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4219372570514679e+08, - "cpu_time": 2.7207201899999517e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7756301084146051e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4230134189128876e+08, - "cpu_time": 2.7217432099999994e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7727747670162029e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4226744294166568e+08, - "cpu_time": 2.7212066307999980e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7736787574110093e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time_median", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4230134189128876e+08, - "cpu_time": 2.7210350220000237e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.7727747670162029e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8358642448490154e+05, - "cpu_time": 2.5130507774927653e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8703267800015230e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2904317438261544e-03, - "cpu_time": 9.2350604656360209e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2906044984451422e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8911380469799042e+08, - "cpu_time": 5.1516256000002158e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7139071415895743e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8933046758174896e+08, - "cpu_time": 5.1539771049999672e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7111260109397893e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8973567485809326e+08, - "cpu_time": 5.1592246000001293e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7059358483414140e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8938519954681396e+08, - "cpu_time": 5.1551689949999970e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7104241187231150e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8986567258834839e+08, - "cpu_time": 5.1578446049998659e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7042738259140821e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8948616385459900e+08, - "cpu_time": 5.1555681810000354e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7091333891015949e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time_median", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8938519954681396e+08, - "cpu_time": 5.1551689949999970e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7104241187231150e+09, - "dst_gpu": 1.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0796472289458814e+05, - "cpu_time": 3.0325864940812730e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9454042520786133e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0638322702333726e-03, - "cpu_time": 5.8821576742159123e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0636997482137589e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2644, - "real_time": 2.6328018322048441e+05, - "cpu_time": 5.2964574773071473e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8893926138848425e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2644, - "real_time": 2.6387904421998747e+05, - "cpu_time": 5.3041951021180663e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8805658214614578e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2644, - "real_time": 2.6395608057319390e+05, - "cpu_time": 5.3045459077156079e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8794332669902225e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2644, - "real_time": 2.6307021450524678e+05, - "cpu_time": 5.3005530105900799e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8924969211198059e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2644, - "real_time": 2.6361562277570099e+05, - "cpu_time": 5.3004233623297431e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8844435288695949e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6356022905892273e+05, - "cpu_time": 5.3012349720121291e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8852664304651842e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time_median", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6361562277570099e+05, - "cpu_time": 5.3005530105900788e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8844435288695949e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8077221751396922e+02, - "cpu_time": 3.3042738529371888e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6148034898810547e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4447256282693623e-03, - "cpu_time": 6.2330265879216888e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4451527560257413e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2647, - "real_time": 2.6308414466031006e+05, - "cpu_time": 5.2962792217604048e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7845816312660882e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2647, - "real_time": 2.6369289436381456e+05, - "cpu_time": 5.3017764185870613e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7666104918792164e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2647, - "real_time": 2.6366086011737707e+05, - "cpu_time": 5.3006624404986412e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7675541189096747e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2647, - "real_time": 2.6312887733568222e+05, - "cpu_time": 5.3032033925196668e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7832582297202535e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2647, - "real_time": 2.6366261834277643e+05, - "cpu_time": 5.3033768039288488e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7675023212334290e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6344587896399212e+05, - "cpu_time": 5.3010596554589248e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7739013586017331e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time_median", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6366086011737707e+05, - "cpu_time": 5.3017764185870613e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7675541189096747e+06, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1046384700788769e+02, - "cpu_time": 2.8934780567595868e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1653031832780216e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1784729684472387e-03, - "cpu_time": 5.4583012545047311e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1789837252226924e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2647, - "real_time": 2.6311051422602724e+05, - "cpu_time": 5.2953600075557700e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5567602883711815e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2647, - "real_time": 2.6359624225809157e+05, - "cpu_time": 5.3014985606345290e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5538916506971812e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2647, - "real_time": 2.6382629490979254e+05, - "cpu_time": 5.3054126860597858e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5525366800153501e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2647, - "real_time": 2.6307386823741259e+05, - "cpu_time": 5.3026284812996432e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5569771438885523e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2647, - "real_time": 2.6364912539136480e+05, - "cpu_time": 5.3010636607480934e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5535799688012751e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6345120900453778e+05, - "cpu_time": 5.3011926792595652e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5547491463547081e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time_median", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6359624225809157e+05, - "cpu_time": 5.3014985606345301e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5538916506971812e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3887828335912195e+02, - "cpu_time": 3.6742432308785038e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0003716828457782e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2863037700209794e-03, - "cpu_time": 6.9309746941544818e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2866202162167991e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2630, - "real_time": 2.6450550766615727e+05, - "cpu_time": 5.3201219049429952e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0970999705380209e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2630, - "real_time": 2.6534462822140852e+05, - "cpu_time": 5.3352869581748871e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0873057634181473e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2630, - "real_time": 2.6523397204965464e+05, - "cpu_time": 5.3344773878326861e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0885937938848834e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2630, - "real_time": 2.6485945954396541e+05, - "cpu_time": 5.3378308403043065e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0929610798515454e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2630, - "real_time": 2.6538922073418705e+05, - "cpu_time": 5.3382169315589895e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0867870131790616e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6506655764307460e+05, - "cpu_time": 5.3331868045627733e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0905495241743322e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time_median", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6523397204965464e+05, - "cpu_time": 5.3352869581748859e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0885937938848834e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7653983843972026e+02, - "cpu_time": 7.4772504639679016e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3939532922386650e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4205482645107952e-03, - "cpu_time": 1.4020229813759362e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4217385153899285e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2607, - "real_time": 2.6747497075003700e+05, - "cpu_time": 5.3851055734559125e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1254329532430589e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2607, - "real_time": 2.6778546099656052e+05, - "cpu_time": 5.3870839355581452e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1183306737517163e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2607, - "real_time": 2.6815694934398431e+05, - "cpu_time": 5.3956808860761137e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1098547101171926e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2607, - "real_time": 2.6826988247678324e+05, - "cpu_time": 5.4022690257000946e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1072826545924008e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2607, - "real_time": 2.6741513796338235e+05, - "cpu_time": 5.3884840314537799e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1268034879324935e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6782048030614952e+05, - "cpu_time": 5.3917246904488094e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1175408959273726e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time_median", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6778546099656052e+05, - "cpu_time": 5.3884840314537799e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1183306737517163e+07, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8732394216461614e+02, - "cpu_time": 7.1183859854744628e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8460852347945416e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4462073315747194e-03, - "cpu_time": 1.3202428525485273e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4460197954187183e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2581, - "real_time": 2.7153608038734988e+05, - "cpu_time": 5.4731863580008724e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2067641233259317e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2581, - "real_time": 2.7209666831125150e+05, - "cpu_time": 5.4734695970553719e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2042778841568421e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2581, - "real_time": 2.7188887043485505e+05, - "cpu_time": 5.4719354746223358e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2051982836808048e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2581, - "real_time": 2.7225623296534788e+05, - "cpu_time": 5.4708103177063796e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2035720777849238e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2581, - "real_time": 2.7152070130765688e+05, - "cpu_time": 5.4745712863230996e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2068324750999728e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7185971068129229e+05, - "cpu_time": 5.4727946067416121e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2053289688096951e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time_median", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7188887043485505e+05, - "cpu_time": 5.4731863580008713e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2051982836808048e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2935279485548563e+02, - "cpu_time": 1.4526856382076863e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4601988967260590e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2114807083039747e-03, - "cpu_time": 2.6543763151977396e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2114525863989290e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2485, - "real_time": 2.8059218474476406e+05, - "cpu_time": 5.6455947122736997e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3356316947891372e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2485, - "real_time": 2.8042459261502459e+05, - "cpu_time": 5.6504732354125183e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3370275548539284e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2485, - "real_time": 2.8114409976024221e+05, - "cpu_time": 5.6540163299798116e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3310466076253659e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2485, - "real_time": 2.8053217909956572e+05, - "cpu_time": 5.6389270301810361e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3361312848441583e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2485, - "real_time": 2.8177631003041967e+05, - "cpu_time": 5.6536516659959452e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3258165313089997e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8089387325000332e+05, - "cpu_time": 5.6485325947686029e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3331307346843177e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time_median", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8059218474476406e+05, - "cpu_time": 5.6504732354125183e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3356316947891372e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.6642980696432312e+02, - "cpu_time": 6.3431134468053654e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6979907077387883e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0165260296018811e-03, - "cpu_time": 1.1229666006849369e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0135994258266227e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2331, - "real_time": 2.9755204776961217e+05, - "cpu_time": 5.9843189403688337e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4050108538149297e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2331, - "real_time": 2.9700245249607728e+05, - "cpu_time": 5.9686303474903572e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4131622112356526e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2331, - "real_time": 3.0011115618422069e+05, - "cpu_time": 5.9811568768767850e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.3674484369898790e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2331, - "real_time": 2.9710959517021419e+05, - "cpu_time": 5.9721514628914604e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4115707513555324e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2331, - "real_time": 2.9768836755193258e+05, - "cpu_time": 5.9843297511796863e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4029936768400639e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9789272383441142e+05, - "cpu_time": 5.9781174757614243e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4000371860472119e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time_median", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9755204776961217e+05, - "cpu_time": 5.9811568768767850e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4050108538149297e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2732966388951768e+03, - "cpu_time": 7.2781762939014743e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8713592579299144e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2743462227125759e-03, - "cpu_time": 1.2174696003233801e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2530532784225313e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2129, - "real_time": 3.2898287594017864e+05, - "cpu_time": 6.6159316439643316e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9683174770369375e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2129, - "real_time": 3.2855435395659244e+05, - "cpu_time": 6.6123197839360544e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9787102755799615e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2129, - "real_time": 3.2906418989625521e+05, - "cpu_time": 6.6138101409113372e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9663484526422250e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2129, - "real_time": 3.2845034281307185e+05, - "cpu_time": 6.6077662752465997e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9812369125518537e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2129, - "real_time": 3.2931347129894479e+05, - "cpu_time": 6.6121362188819854e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9603181420425534e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2887304678100866e+05, - "cpu_time": 6.6123928125880635e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9709862519707060e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time_median", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2898287594017864e+05, - "cpu_time": 6.6123197839360544e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9683174770369375e+08, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6152996124075509e+02, - "cpu_time": 3.0003403262971500e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7632284982191352e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0992994554567196e-03, - "cpu_time": 4.5374502261652988e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0993907430278855e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1779, - "real_time": 3.9448934203320555e+05, - "cpu_time": 7.9194841708824632e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3290295684486930e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1779, - "real_time": 3.9355625822695688e+05, - "cpu_time": 7.9068177009555302e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3321805689535053e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1779, - "real_time": 3.9405718511151080e+05, - "cpu_time": 7.9079419449129887e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3304870963122683e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1779, - "real_time": 3.9360002057216939e+05, - "cpu_time": 7.9031940078696760e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3320324507042756e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1779, - "real_time": 3.9558893155284069e+05, - "cpu_time": 7.9402874704892770e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3253353624985547e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9425834749933670e+05, - "cpu_time": 7.9155450590219884e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3298130093834596e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time_median", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9405718511151086e+05, - "cpu_time": 7.9079419449129875e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3304870963122683e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3525481049960854e+02, - "cpu_time": 1.5118086146775461e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8128612036003484e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1185469269005492e-03, - "cpu_time": 1.9099235787362681e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1152306254730306e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1296, - "real_time": 5.4107400514853734e+05, - "cpu_time": 1.0847676435185317e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9379530157101920e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1296, - "real_time": 5.4432301871718571e+05, - "cpu_time": 1.0849447901234501e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9263855540616212e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1296, - "real_time": 5.4085375863288378e+05, - "cpu_time": 1.0842409521604818e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9387421891094663e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1296, - "real_time": 5.4186956814517570e+05, - "cpu_time": 1.0815910925925842e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9351077485109284e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1296, - "real_time": 5.3870796415858530e+05, - "cpu_time": 1.0802866319444869e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9464646334638543e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4136566296047368e+05, - "cpu_time": 1.0831662220679068e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9369306281712124e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time_median", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4107400514853734e+05, - "cpu_time": 1.0842409521604818e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9379530157101920e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0254843092549443e+03, - "cpu_time": 2.1009504935471941e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2413010651953975e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.7414347599707847e-03, - "cpu_time": 1.9396381190102136e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7385443545969433e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 895, - "real_time": 7.7446195603915432e+05, - "cpu_time": 1.5517161050279127e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7078825288275032e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 895, - "real_time": 7.7386628706320375e+05, - "cpu_time": 1.5510817966480583e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7099668703215132e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 895, - "real_time": 7.7419737978271267e+05, - "cpu_time": 1.5517012692737416e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7088079277516928e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 895, - "real_time": 7.7487401528981142e+05, - "cpu_time": 1.5533246860334724e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7064425424249668e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 895, - "real_time": 7.7489923501085467e+05, - "cpu_time": 1.5529485173185002e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7063544590679889e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7445977463714755e+05, - "cpu_time": 1.5521544748603371e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7078908656787333e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time_median", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7446195603915432e+05, - "cpu_time": 1.5517161050279127e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7078825288275032e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4322794823895248e+02, - "cpu_time": 9.4181999011747484e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5499236382738345e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.7230596443387288e-04, - "cpu_time": 6.0678238240573310e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7237300731665416e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 524, - "real_time": 1.3333690101245262e+06, - "cpu_time": 2.6884862347328062e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1456438301414289e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 524, - "real_time": 1.3346499283549213e+06, - "cpu_time": 2.6908540896944511e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1426248268486896e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 524, - "real_time": 1.3332807675327482e+06, - "cpu_time": 2.6876145114503559e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1458520231725907e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 524, - "real_time": 1.3339525330385179e+06, - "cpu_time": 2.6894882480916334e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1442678027276473e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 524, - "real_time": 1.3324719185421939e+06, - "cpu_time": 2.6865966851145984e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1477616463308477e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3335448315185816e+06, - "cpu_time": 2.6886079538167692e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1452300258442407e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time_median", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3333690101245262e+06, - "cpu_time": 2.6884862347328062e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1456438301414289e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.1228762620058569e+02, - "cpu_time": 1.6482558547557364e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9157343301407949e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.0911909896241626e-04, - "cpu_time": 6.1305176621822416e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0909196287688833e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 280, - "real_time": 2.4959556982919043e+06, - "cpu_time": 5.0087207464287076e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3608801653573842e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 280, - "real_time": 2.4982991753079528e+06, - "cpu_time": 5.0121680321426857e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3577275623789043e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 280, - "real_time": 2.5203551332067167e+06, - "cpu_time": 5.0565766142856972e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3283436486694417e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 280, - "real_time": 2.5202168284782344e+06, - "cpu_time": 5.0552987250000574e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3285263018679380e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 280, - "real_time": 2.5207780052109486e+06, - "cpu_time": 5.0573219535713019e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3277853038463049e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5111209680991517e+06, - "cpu_time": 5.0380172142856903e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3406525964239945e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time_median", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5202168284782339e+06, - "cpu_time": 5.0552987250000564e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3285263018679380e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2802798773564069e+04, - "cpu_time": 2.5210306157271036e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7064828156856429e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.0984396754312601e-03, - "cpu_time": 5.0040135007449462e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1082318990976474e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 140, - "real_time": 4.9603321722575594e+06, - "cpu_time": 9.8841338142855354e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3822767140137529e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 140, - "real_time": 4.9576670097719347e+06, - "cpu_time": 9.8850947714286763e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3840949718750463e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 140, - "real_time": 4.9592087377927136e+06, - "cpu_time": 9.8875392071428392e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3830429181465240e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 140, - "real_time": 4.9627379447753942e+06, - "cpu_time": 9.8915780000002738e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3806370972423592e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 140, - "real_time": 4.9621459163193190e+06, - "cpu_time": 9.8922594071430992e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3810404375300055e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9604183561833836e+06, - "cpu_time": 9.8881210400000848e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3822184277615380e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time_median", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9603321722575594e+06, - "cpu_time": 9.8875392071428392e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3822767140137529e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0859929689155274e+03, - "cpu_time": 3.6902389812293964e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4223982110224969e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2052762874632201e-04, - "cpu_time": 3.7319921209513882e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2055184826246902e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 71, - "real_time": 9.7929050516284686e+06, - "cpu_time": 1.9607759760564040e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4264022599116502e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 71, - "real_time": 9.8399629973819554e+06, - "cpu_time": 1.9679400718310192e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4100160751547108e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 71, - "real_time": 9.8544848217091095e+06, - "cpu_time": 1.9730953718308996e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4049909870560336e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 71, - "real_time": 9.8275867828600835e+06, - "cpu_time": 1.9649797859154232e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4143104244595423e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 71, - "real_time": 9.8712600137985926e+06, - "cpu_time": 1.9690731253520835e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.3992045547473941e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8372399334756453e+06, - "cpu_time": 1.9671728661971662e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4109848602658663e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time_median", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8399629973819572e+06, - "cpu_time": 1.9679400718310192e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4100160751547108e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9668721650414423e+04, - "cpu_time": 4.6099204687877951e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0300439891064847e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0159599492387318e-03, - "cpu_time": 2.3434241840166532e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0197846994436638e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 33, - "real_time": 2.1243033930659294e+07, - "cpu_time": 4.1840375272727214e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1590997886203170e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 33, - "real_time": 2.1230025329824649e+07, - "cpu_time": 4.1839352757575177e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1610355125541573e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 33, - "real_time": 2.1228468892249193e+07, - "cpu_time": 4.1868454212118253e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1612672746503339e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 33, - "real_time": 2.1267906734437652e+07, - "cpu_time": 4.1865880363636941e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1554052233704433e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 33, - "real_time": 2.1286990098429449e+07, - "cpu_time": 4.1837735484846510e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1525764652350397e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1251284997120049e+07, - "cpu_time": 4.1850359618180826e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1578768528860583e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time_median", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1243033930659294e+07, - "cpu_time": 4.1840375272727214e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1590997886203170e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5454688191307643e+04, - "cpu_time": 1.5398983302500483e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7805662329762192e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1977952483700274e-03, - "cpu_time": 3.6795342842910211e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1971860870765337e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 18, - "real_time": 3.8968822608391441e+07, - "cpu_time": 7.7145791166666791e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4442335953742137e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 18, - "real_time": 3.9008154844244324e+07, - "cpu_time": 7.7195139833337277e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4407607469750371e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 18, - "real_time": 3.8987515494227409e+07, - "cpu_time": 7.7087322666664526e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4425822291721210e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 18, - "real_time": 3.8962129089567393e+07, - "cpu_time": 7.7027538833331406e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4448252992400894e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 18, - "real_time": 3.9004804566502571e+07, - "cpu_time": 7.7211116944441617e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4410562875955682e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8986285320586629e+07, - "cpu_time": 7.7133381888888344e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4426916316714058e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time_median", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8987515494227409e+07, - "cpu_time": 7.7145791166666791e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4425822291721210e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0683457618291832e+04, - "cpu_time": 7.6378951777892056e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8265284166855987e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.3053163306558920e-04, - "cpu_time": 9.9021914905685006e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3055243167359433e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.5158007442951202e+07, - "cpu_time": 1.4647766566666734e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5716148569233470e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.5006292098098338e+07, - "cpu_time": 1.4626016777776840e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5788391679050317e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.5145014458232462e+07, - "cpu_time": 1.4632880999999997e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5722324087009573e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.4973865515655935e+07, - "cpu_time": 1.4628473277777073e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5803870342518978e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.4988923139042318e+07, - "cpu_time": 1.4640450955554721e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5796680998108830e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5054420530796066e+07, - "cpu_time": 1.4635117715555075e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5765483135184236e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time_median", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5006292098098338e+07, - "cpu_time": 1.4632880999999997e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5788391679050317e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9488648554287007e+04, - "cpu_time": 8.9500754393684299e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2627129143398805e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1923168271956526e-03, - "cpu_time": 6.1154789550177358e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1918510643985803e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4775233268737793e+08, - "cpu_time": 2.8249743260000741e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6335867071279302e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4783528447151184e+08, - "cpu_time": 2.8251424019999832e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6315478670686097e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4771163165569305e+08, - "cpu_time": 2.8217991960000288e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6345879195987344e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4803204834461212e+08, - "cpu_time": 2.8238003660001141e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6267208216303811e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4794673621654510e+08, - "cpu_time": 2.8247019759999144e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6288121369179683e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4785560667514801e+08, - "cpu_time": 2.8240836532000232e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6310510904687252e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time_median", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4783528447151184e+08, - "cpu_time": 2.8247019759999144e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6315478670686097e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3345745651550504e+05, - "cpu_time": 1.3780027642898285e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2767911257692333e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.0262019490896270e-04, - "cpu_time": 4.8794686472137150e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0243597353135529e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.9030250012874603e+08, - "cpu_time": 5.1704995850002432e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6986998855463080e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.9063211381435394e+08, - "cpu_time": 5.1728208399998719e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6945050906723623e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.9048492014408112e+08, - "cpu_time": 5.1702267799998933e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6963771595008163e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.9103539884090424e+08, - "cpu_time": 5.1786173100003910e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6893856495682354e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.9138474166393280e+08, - "cpu_time": 5.1796461349999845e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6849624241422873e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9076793491840363e+08, - "cpu_time": 5.1743621300000775e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6927860418860016e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time_median", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9063211381435394e+08, - "cpu_time": 5.1728208399998724e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6945050906723623e+09, - "dst_gpu": 2.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3793886256311683e+05, - "cpu_time": 4.4839495426752977e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5586973251509210e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5061456576565527e-03, - "cpu_time": 8.6657049313926357e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5052855112916183e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2679, - "real_time": 2.5997473057642780e+05, - "cpu_time": 5.2290699066813954e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9388443551015151e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2679, - "real_time": 2.5925242379252124e+05, - "cpu_time": 5.2196751325123006e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9498184241452008e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2679, - "real_time": 2.5989334567437123e+05, - "cpu_time": 5.2280868831649818e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9400777936153957e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2679, - "real_time": 2.5926868203523685e+05, - "cpu_time": 5.2206573684212397e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9495707385932156e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2679, - "real_time": 2.5920990088003085e+05, - "cpu_time": 5.2277879022026999e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9504663846692112e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5951981659171762e+05, - "cpu_time": 5.2250554385965242e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9457555392249078e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time_median", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5926868203523691e+05, - "cpu_time": 5.2277879022026993e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9495707385932156e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7983086099969438e+02, - "cpu_time": 4.5017408401016235e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7718304307209246e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4635909734679443e-03, - "cpu_time": 8.6156805281874954e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4627947355944726e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2687, - "real_time": 2.5978780848174807e+05, - "cpu_time": 5.2266985708967072e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8833568517665314e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2687, - "real_time": 2.5975295658520370e+05, - "cpu_time": 5.2270128284334630e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8844145873204675e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2687, - "real_time": 2.6062546516007840e+05, - "cpu_time": 5.2274212132489862e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8580195482513607e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2687, - "real_time": 2.6013893190966133e+05, - "cpu_time": 5.2322898995161394e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8727162634434542e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2687, - "real_time": 2.6002055808526068e+05, - "cpu_time": 5.2317768328991509e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8763003013341017e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6006514404439047e+05, - "cpu_time": 5.2290398689988907e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8749615104231834e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time_median", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6002055808526068e+05, - "cpu_time": 5.2274212132489868e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8763003013341017e+06, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5205409152379656e+02, - "cpu_time": 2.7506493068406553e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0650187750050613e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3537150194326102e-03, - "cpu_time": 5.2603333991547323e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3524114036562820e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2684, - "real_time": 2.5972737541218218e+05, - "cpu_time": 5.2257178502235649e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5770382284500159e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2684, - "real_time": 2.5969429799801795e+05, - "cpu_time": 5.2237486587183992e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5772390967287473e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2684, - "real_time": 2.6029028442725414e+05, - "cpu_time": 5.2269852570787707e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5736276937930616e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2684, - "real_time": 2.5973098216184182e+05, - "cpu_time": 5.2259954061099689e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5770163289367335e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2684, - "real_time": 2.5982928652997824e+05, - "cpu_time": 5.2261586997020565e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5764196772050243e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5985444530585487e+05, - "cpu_time": 5.2257211743665516e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5762682050227165e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time_median", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5973098216184182e+05, - "cpu_time": 5.2259954061099689e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5770163289367335e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4881005294734391e+02, - "cpu_time": 1.1995171542569241e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5075227651680754e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.5749777401147988e-04, - "cpu_time": 2.2954097898312121e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5638721910675699e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2669, - "real_time": 2.6140560880127168e+05, - "cpu_time": 5.2634705470217287e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1338271728621561e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2669, - "real_time": 2.6136041436911066e+05, - "cpu_time": 5.2580221281379589e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1343690741286896e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2669, - "real_time": 2.6188601129320191e+05, - "cpu_time": 5.2603981116519438e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1280784947419029e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2669, - "real_time": 2.6142455261427828e+05, - "cpu_time": 5.2609072011992359e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1336000838784933e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2669, - "real_time": 2.6145919659712346e+05, - "cpu_time": 5.2641873698013660e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1331848742053874e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6150715673499717e+05, - "cpu_time": 5.2613970715624467e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1326119399633259e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time_median", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6142455261427825e+05, - "cpu_time": 5.2609072011992359e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1336000838784933e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1476713940991468e+02, - "cpu_time": 2.4856187220656184e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5700738845167467e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.2126677560703505e-04, - "cpu_time": 4.7242561020536665e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2042523420466668e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2628, - "real_time": 2.6334408334264311e+05, - "cpu_time": 5.3088394977170497e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.2215181719812550e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2628, - "real_time": 2.6385401956295123e+05, - "cpu_time": 5.3079531088281074e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.2094941843745708e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2628, - "real_time": 2.6465061643096030e+05, - "cpu_time": 5.3148514231356420e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1908036417795815e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2628, - "real_time": 2.6424968088868947e+05, - "cpu_time": 5.3184992503804155e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.2001967021869250e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2628, - "real_time": 2.6431914889691339e+05, - "cpu_time": 5.3198513242011936e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1985671747111641e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6408350982443150e+05, - "cpu_time": 5.3139989208524814e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.2041159750066988e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time_median", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6424968088868953e+05, - "cpu_time": 5.3148514231356420e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.2001967021869250e+07, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0104036771562386e+02, - "cpu_time": 5.4406305027582323e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1780595227958560e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8972800234619970e-03, - "cpu_time": 1.0238298094884513e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8988354304491932e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2602, - "real_time": 2.6828298882946739e+05, - "cpu_time": 5.3969367255955376e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2213968594493632e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2602, - "real_time": 2.6820416932578036e+05, - "cpu_time": 5.4006851691006438e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2217558020210192e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2602, - "real_time": 2.6881793011858599e+05, - "cpu_time": 5.3997201998459978e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2189663087408184e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2602, - "real_time": 2.6834153103902377e+05, - "cpu_time": 5.4020636664105498e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2211303957729408e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2602, - "real_time": 2.6847727901086089e+05, - "cpu_time": 5.4054334012297716e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2205129655934279e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6842477966474363e+05, - "cpu_time": 5.4009678324364999e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2207524663155138e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time_median", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6834153103902377e+05, - "cpu_time": 5.4006851691006438e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2211303957729408e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4136453600674213e+02, - "cpu_time": 3.1236382921389469e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0968677223120388e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.9918872731571513e-04, - "cpu_time": 5.7834787931514153e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9851771966729249e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2520, - "real_time": 2.7703065665379638e+05, - "cpu_time": 5.5780854484127637e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3656587610771164e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2520, - "real_time": 2.7698576672091370e+05, - "cpu_time": 5.5773562023808784e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3660421535678759e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2520, - "real_time": 2.7642132133931026e+05, - "cpu_time": 5.5633306507937203e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3708735521003398e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2520, - "real_time": 2.7728995718505408e+05, - "cpu_time": 5.5812201071427402e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3634465764753050e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2520, - "real_time": 2.7656716129202984e+05, - "cpu_time": 5.5784476785713795e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3696233382820138e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7685897263822088e+05, - "cpu_time": 5.5756880174602964e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3671288763005301e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time_median", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7698576672091370e+05, - "cpu_time": 5.5780854484127637e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3660421535678759e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5636790732816087e+02, - "cpu_time": 7.0614228864181371e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0473953837662743e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2871820766084997e-03, - "cpu_time": 1.2664666430950323e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2873804270973617e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2379, - "real_time": 2.9112648350944545e+05, - "cpu_time": 5.9117090121897019e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.5022355376249182e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2379, - "real_time": 2.9405591218006500e+05, - "cpu_time": 5.9116669861283491e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4573835985225189e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2379, - "real_time": 2.9125083721604571e+05, - "cpu_time": 5.9158196553173230e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.5003132438301855e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2379, - "real_time": 2.9142267070857465e+05, - "cpu_time": 5.9128282051285228e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4976596941242510e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2379, - "real_time": 2.9421234865748830e+05, - "cpu_time": 5.9120878856662090e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4550135505219537e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9241365045432386e+05, - "cpu_time": 5.9128223488860216e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4825211249247658e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time_median", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9142267070857459e+05, - "cpu_time": 5.9120878856662079e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4976596941242510e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5750645248242301e+03, - "cpu_time": 1.7390872654702693e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4098525493315975e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.3864261205899535e-03, - "cpu_time": 2.9412134558683541e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3761097430902668e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2147, - "real_time": 3.2568002659118240e+05, - "cpu_time": 6.5409198462976108e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0491273211870146e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2147, - "real_time": 3.2503726404931518e+05, - "cpu_time": 6.5428596040988842e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0650445039503860e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2147, - "real_time": 3.2574463548168232e+05, - "cpu_time": 6.5488383977641049e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0475308399895716e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2147, - "real_time": 3.2566467059960973e+05, - "cpu_time": 6.5466808430367894e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0495068598427856e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2147, - "real_time": 3.2444511333972384e+05, - "cpu_time": 6.5377977317188436e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0797641641626811e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2531434201230278e+05, - "cpu_time": 6.5434192845832475e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0581947378264892e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time_median", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2566467059960973e+05, - "cpu_time": 6.5428596040988842e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0495068598427856e+08, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.6434441673421497e+02, - "cpu_time": 4.4206006878719302e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3996208716934740e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7347664822993649e-03, - "cpu_time": 6.7557961604067978e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7368913475414335e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1792, - "real_time": 3.9001302208622033e+05, - "cpu_time": 7.8396780747766059e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3442833195556622e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1792, - "real_time": 3.8912668576683378e+05, - "cpu_time": 7.8239082756700483e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3473452712882185e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1792, - "real_time": 3.8920927849111258e+05, - "cpu_time": 7.8215252734376804e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3470593559140236e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1792, - "real_time": 3.8966293789144402e+05, - "cpu_time": 7.8315029854910832e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3454910616776726e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1792, - "real_time": 3.8917364832156763e+05, - "cpu_time": 7.8249721484377072e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3471826837740812e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8943711451143574e+05, - "cpu_time": 7.8283173515626253e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3462723384419317e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time_median", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8920927849111258e+05, - "cpu_time": 7.8249721484377072e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3470593559140236e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8741303033344877e+02, - "cpu_time": 7.3480772128030208e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3384598917860782e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.9480253909408115e-04, - "cpu_time": 9.3865346572035119e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9419697899691298e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1324, - "real_time": 5.2792747887315694e+05, - "cpu_time": 1.0628201457704180e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9862122014147656e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1324, - "real_time": 5.3038247063470399e+05, - "cpu_time": 1.0630035611782130e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9770185819776027e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1324, - "real_time": 5.2799840851298615e+05, - "cpu_time": 1.0638474962235966e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9859453799361410e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1324, - "real_time": 5.3111623737537605e+05, - "cpu_time": 1.0656415075528200e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9742872204053893e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1324, - "real_time": 5.2775235839956219e+05, - "cpu_time": 1.0636389682779426e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9868712726928663e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2903539075915725e+05, - "cpu_time": 1.0637903358005981e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9820669312853532e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time_median", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2799840851298603e+05, - "cpu_time": 1.0636389682779426e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9859453799361410e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5885150135287818e+03, - "cpu_time": 1.1195199079381305e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9438425460706810e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0026630378154643e-03, - "cpu_time": 1.0523877405744532e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9988102077946233e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 907, - "real_time": 7.7022852337854495e+05, - "cpu_time": 1.5439058710033714e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7227659536691957e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 907, - "real_time": 7.7025497654635692e+05, - "cpu_time": 1.5435470837928231e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7226724446535077e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 907, - "real_time": 7.7036841544800135e+05, - "cpu_time": 1.5444359217200219e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7222715235286722e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 907, - "real_time": 7.7038482256395929e+05, - "cpu_time": 1.5448039900771999e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7222135464979115e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 907, - "real_time": 7.7224343380035460e+05, - "cpu_time": 1.5484755843439379e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7156618084527082e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7069603434744338e+05, - "cpu_time": 1.5450336901874708e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7211170553603992e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time_median", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7036841544800135e+05, - "cpu_time": 1.5444359217200219e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7222715235286722e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.6771689993968448e+02, - "cpu_time": 1.9836014814630212e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0591220092569045e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1258873294636709e-03, - "cpu_time": 1.2838564583160226e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1242155140774486e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 526, - "real_time": 1.3291445882112752e+06, - "cpu_time": 2.6798408022814384e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1556416338756452e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 526, - "real_time": 1.3295692440827056e+06, - "cpu_time": 2.6808280741445776e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1546337422190661e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 526, - "real_time": 1.3302466557662184e+06, - "cpu_time": 2.6804323707224475e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1530272839393778e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 526, - "real_time": 1.3303065753520641e+06, - "cpu_time": 2.6811777167301509e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1528852654809909e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 526, - "real_time": 1.3298207970102364e+06, - "cpu_time": 2.6807679714829386e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1540370021508350e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3298175720845000e+06, - "cpu_time": 2.6806093870723108e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1540449855331831e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time_median", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3298207970102364e+06, - "cpu_time": 2.6807679714829391e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1540370021508350e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8420591955702093e+02, - "cpu_time": 5.0448712009672755e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1485481294921862e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.6411454452209123e-04, - "cpu_time": 1.8819866950018957e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6415083956008545e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 281, - "real_time": 2.5197886861860752e+06, - "cpu_time": 5.0537970071173795e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3290918583720231e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 281, - "real_time": 2.5111965162288463e+06, - "cpu_time": 5.0529553594305590e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3404824934200978e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 281, - "real_time": 2.5189209205771256e+06, - "cpu_time": 5.0523804056938449e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3302387270172954e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 281, - "real_time": 2.5117898267093925e+06, - "cpu_time": 5.0535013380784616e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3396934372449546e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 281, - "real_time": 2.5220451705833878e+06, - "cpu_time": 5.0591255836302619e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3261133059165573e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5167482240569657e+06, - "cpu_time": 5.0543519387901025e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3331239643941860e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time_median", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5189209205771261e+06, - "cpu_time": 5.0535013380784625e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3302387270172954e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9353274128566718e+03, - "cpu_time": 2.7228905795657261e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5390696764111640e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9609937003952612e-03, - "cpu_time": 5.3872199889141959e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9618441276904853e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 142, - "real_time": 4.9390061135390699e+06, - "cpu_time": 9.8491714295769706e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3968809947429285e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 142, - "real_time": 4.9438174407352023e+06, - "cpu_time": 9.8514457464793399e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3935751473673015e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 142, - "real_time": 4.9466940207065828e+06, - "cpu_time": 9.8562979436621051e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3916017303216081e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 142, - "real_time": 4.9429881668479089e+06, - "cpu_time": 9.8504212323940042e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3941444797547741e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 142, - "real_time": 4.9426523594736634e+06, - "cpu_time": 9.8524235000002291e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3943750803842869e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9430316202604864e+06, - "cpu_time": 9.8519519704225305e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3941154865141797e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time_median", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9429881668479089e+06, - "cpu_time": 9.8514457464793418e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3941444797547741e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7559536517885354e+03, - "cpu_time": 2.7129620604245943e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8925645263504228e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.5754319686979930e-04, - "cpu_time": 2.7537304978439116e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5760168853126501e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 71, - "real_time": 9.8554184660315514e+06, - "cpu_time": 1.9693154802817382e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4046684182565465e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 71, - "real_time": 9.7983188166374899e+06, - "cpu_time": 1.9549479070422061e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4245091048705997e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 71, - "real_time": 9.8253137392687127e+06, - "cpu_time": 1.9642050112674695e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4151003103232632e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 71, - "real_time": 9.8228392938912753e+06, - "cpu_time": 1.9621011492958274e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4159605991790137e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 71, - "real_time": 9.8413676679344252e+06, - "cpu_time": 1.9667988169014510e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4095293593520055e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8286515967526920e+06, - "cpu_time": 1.9634736729577385e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4139535583962860e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time_median", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8253137392687146e+06, - "cpu_time": 1.9642050112674698e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4151003103232632e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1466051475939708e+04, - "cpu_time": 5.4838548583085263e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4590578936270494e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1840281207070075e-03, - "cpu_time": 2.7929352625582970e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1848738613570837e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 33, - "real_time": 2.1231650233720288e+07, - "cpu_time": 4.1837386606058508e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1607935917019362e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 33, - "real_time": 2.1211713326699805e+07, - "cpu_time": 4.1774237878788278e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1637644242310262e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 33, - "real_time": 2.1239451668930776e+07, - "cpu_time": 4.1840493363638006e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1596326047422085e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 33, - "real_time": 2.1200401482708525e+07, - "cpu_time": 4.1802802999999397e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1654525059223685e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 33, - "real_time": 2.1187029778957367e+07, - "cpu_time": 4.1745876878790669e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1674503080489125e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1214049298203357e+07, - "cpu_time": 4.1800159545454971e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1634186869292908e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time_median", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1211713326699808e+07, - "cpu_time": 4.1802802999999389e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1637644242310262e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1661298557099377e+04, - "cpu_time": 4.0737573206466659e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2301496132779978e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0210826915978697e-03, - "cpu_time": 9.7457937121429351e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0210945603326008e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 18, - "real_time": 3.8975346212585770e+07, - "cpu_time": 7.7138258777779356e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4436571074424205e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 18, - "real_time": 3.8890431117680341e+07, - "cpu_time": 7.7084337055560410e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4511761413460402e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 18, - "real_time": 3.8904768932196826e+07, - "cpu_time": 7.6995463722223818e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4499042581107330e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 18, - "real_time": 3.8917266660266452e+07, - "cpu_time": 7.6958717055554688e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4487963703019490e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 18, - "real_time": 3.8823710754513741e+07, - "cpu_time": 7.6883175388894022e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4571071489964547e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8902304735448629e+07, - "cpu_time": 7.7011990400002465e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4501282052395196e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time_median", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8904768932196833e+07, - "cpu_time": 7.6995463722223833e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4499042581107330e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4504553663841871e+04, - "cpu_time": 1.0109677193947601e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8348440864375345e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4010623286845041e-03, - "cpu_time": 1.3127406708277048e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4013520074689177e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.4187412858009338e+07, - "cpu_time": 1.4448221766666496e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6183423259922924e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.3983037637339696e+07, - "cpu_time": 1.4437737866666743e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6283378538179808e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.4088836709658310e+07, - "cpu_time": 1.4454683855554625e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6231565769071717e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.3971963591045797e+07, - "cpu_time": 1.4430469911111584e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6288810377408137e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.3913473221990794e+07, - "cpu_time": 1.4416323822222745e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6317527008071222e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4028944803608790e+07, - "cpu_time": 1.4437487444444439e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6260940990530763e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time_median", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.3983037637339696e+07, - "cpu_time": 1.4437737866666743e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.6283378538179808e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0884298017520415e+05, - "cpu_time": 1.5067760445968591e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3277635659251995e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4702759908837473e-03, - "cpu_time": 1.0436553107976334e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4692844202020294e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4720145463943481e+08, - "cpu_time": 2.8118995520001137e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6471848278608923e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4738731086254120e+08, - "cpu_time": 2.8173941140000808e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6425857073999095e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4757800400257111e+08, - "cpu_time": 2.8134892519999540e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6378789347946911e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4745265841484070e+08, - "cpu_time": 2.8172125339999640e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6409713990342369e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4745665192604065e+08, - "cpu_time": 2.8191036400000942e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6408727920207806e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4741521596908572e+08, - "cpu_time": 2.8158198184000415e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6418987322221026e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time_median", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4745265841484070e+08, - "cpu_time": 2.8172125339999640e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6409713990342369e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3792336651228444e+05, - "cpu_time": 3.0000656689237867e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4090326146401120e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.3561146728033957e-04, - "cpu_time": 1.0654324006528352e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3605914532392622e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8837114572525024e+08, - "cpu_time": 5.1388988299999028e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7234717825167675e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8792530298233032e+08, - "cpu_time": 5.1305311400000167e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7292374545695777e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8815858066082001e+08, - "cpu_time": 5.1314214149999774e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7262184646302752e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8777793049812317e+08, - "cpu_time": 5.1307543600000829e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7311472152900300e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8791844844818115e+08, - "cpu_time": 5.1308785950004679e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7293262372982306e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8803028166294098e+08, - "cpu_time": 5.1324968680000895e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7278802308609767e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time_median", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8792530298233032e+08, - "cpu_time": 5.1308785950004673e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7292374545695777e+09, - "dst_gpu": 3.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3444468618520387e+05, - "cpu_time": 3.5937774277145654e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0332351485237670e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.1395846586559907e-04, - "cpu_time": 7.0020060803561762e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1366217814975855e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2666, - "real_time": 2.6169499363469004e+05, - "cpu_time": 5.2706671642909327e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9129521959042149e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2666, - "real_time": 2.6224347031914571e+05, - "cpu_time": 5.2641826969240827e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9047683389554368e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2666, - "real_time": 2.6276554574654420e+05, - "cpu_time": 5.2737489009754418e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8970101543971822e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2666, - "real_time": 2.6227497859978146e+05, - "cpu_time": 5.2800663878471975e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9042992414559410e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2666, - "real_time": 2.6288155410599470e+05, - "cpu_time": 5.2789634733685653e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8952904226483684e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6237210848123126e+05, - "cpu_time": 5.2735257246812445e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9028640706722289e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time_median", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6227497859978152e+05, - "cpu_time": 5.2737489009754406e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9042992414559410e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7402379484259365e+02, - "cpu_time": 6.4780924713000559e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0548689520200005e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8066851601968310e-03, - "cpu_time": 1.2284177245938477e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8076132871327161e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2668, - "real_time": 2.6166643780244951e+05, - "cpu_time": 5.2749817766118643e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8267584379551951e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2668, - "real_time": 2.6205582154992930e+05, - "cpu_time": 5.2739749062969512e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8151288068591757e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2668, - "real_time": 2.6243375757622923e+05, - "cpu_time": 5.2675656184407906e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8038740858447542e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2668, - "real_time": 2.6192047020479426e+05, - "cpu_time": 5.2681232983505446e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8191673922953764e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2668, - "real_time": 2.6252479104171932e+05, - "cpu_time": 5.2677703073463228e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8011680034992984e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6212025563502437e+05, - "cpu_time": 5.2704831814092945e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8132193452907596e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time_median", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6205582154992927e+05, - "cpu_time": 5.2681232983505458e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8151288068591757e+06, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5775304228415240e+02, - "cpu_time": 3.6698231867814985e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0664204727989272e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3648431763407362e-03, - "cpu_time": 6.9629729580129504e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3648925310687557e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2667, - "real_time": 2.6205064950861459e+05, - "cpu_time": 5.2735928646419174e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5630566104990132e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2667, - "real_time": 2.6145744877600259e+05, - "cpu_time": 5.2653088638919964e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5666029096417710e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2667, - "real_time": 2.6206402959908632e+05, - "cpu_time": 5.2651590776153025e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5629768061897650e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2667, - "real_time": 2.6150754108423676e+05, - "cpu_time": 5.2662270416197414e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5663028236270240e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2667, - "real_time": 2.6189149306744148e+05, - "cpu_time": 5.2601746381698386e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5640065097285198e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6179423240707637e+05, - "cpu_time": 5.2660924971877586e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5645891319372186e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time_median", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6189149306744145e+05, - "cpu_time": 5.2653088638919953e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5640065097285198e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9309342345589107e+02, - "cpu_time": 4.8161193601108027e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7521204842722003e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1195564576080732e-03, - "cpu_time": 9.1455274716172291e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1198598076050720e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2661, - "real_time": 2.6389422666742397e+05, - "cpu_time": 5.3110686997371749e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1042740508014489e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2661, - "real_time": 2.6401790714093333e+05, - "cpu_time": 5.3107306726797856e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1028198385146253e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2661, - "real_time": 2.6330268469639821e+05, - "cpu_time": 5.3074422886132437e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1112481855039969e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2661, - "real_time": 2.6329144536799652e+05, - "cpu_time": 5.2993403344608273e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1113809977951340e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2661, - "real_time": 2.6379850165350083e+05, - "cpu_time": 5.3067659263434785e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1054005040408403e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6366095310525061e+05, - "cpu_time": 5.3070695843669027e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1070247153312095e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time_median", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6379850165350083e+05, - "cpu_time": 5.3074422886132437e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1054005040408403e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4119076855123166e+02, - "cpu_time": 4.7267566083316012e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0218187398939925e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2940511840410136e-03, - "cpu_time": 8.9065284206094920e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2944276625959398e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2633, - "real_time": 2.6694981824453501e+05, - "cpu_time": 5.3700512305354525e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1374831074024953e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2633, - "real_time": 2.6679649669022654e+05, - "cpu_time": 5.3687408963157958e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1410101718926318e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2633, - "real_time": 2.6614799364436342e+05, - "cpu_time": 5.3595678199773817e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1559735152063154e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2633, - "real_time": 2.6621882686305873e+05, - "cpu_time": 5.3673506874286104e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1543355866517372e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2633, - "real_time": 2.6683009848286188e+05, - "cpu_time": 5.3611228256741492e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1402368372818038e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6658864678500913e+05, - "cpu_time": 5.3653666919862782e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1458078436869971e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time_median", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6679649669022654e+05, - "cpu_time": 5.3673506874286092e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1410101718926318e+07, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7512907567220179e+02, - "cpu_time": 4.7144382495908349e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6518535398491353e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4071457288078934e-03, - "cpu_time": 8.7867959828958730e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4077650587036104e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2596, - "real_time": 2.7092899093964067e+05, - "cpu_time": 5.4489546186441276e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2094682036925413e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2596, - "real_time": 2.7042267045765993e+05, - "cpu_time": 5.4436929815100692e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2117327273095797e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2596, - "real_time": 2.7093077749553823e+05, - "cpu_time": 5.4478549075498944e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2094602282880037e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2596, - "real_time": 2.7042402805717813e+05, - "cpu_time": 5.4448756779659714e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2117266440936075e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2596, - "real_time": 2.7130168860578025e+05, - "cpu_time": 5.4475959129429585e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2078067102491987e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7080163111115946e+05, - "cpu_time": 5.4465948197226052e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2100389027265865e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time_median", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7092899093964067e+05, - "cpu_time": 5.4475959129429585e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2094682036925413e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7721083485105117e+02, - "cpu_time": 2.2099079900600981e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6852861318630734e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3929415170184575e-03, - "cpu_time": 4.0574121321781167e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3927536776426031e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2504, - "real_time": 2.7902752549743454e+05, - "cpu_time": 5.6196241733226285e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3487288532973981e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2504, - "real_time": 2.8009749810433033e+05, - "cpu_time": 5.6238349081470724e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3397567077014461e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2504, - "real_time": 2.7972011074556573e+05, - "cpu_time": 5.6210641054312570e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3429134153179196e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2504, - "real_time": 2.7972017893732822e+05, - "cpu_time": 5.6191801238019241e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3429128441492760e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2504, - "real_time": 2.7979244616592285e+05, - "cpu_time": 5.6256523362616717e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3423076962247851e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7967155189011630e+05, - "cpu_time": 5.6218711293929105e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3433239033381650e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time_median", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7972017893732816e+05, - "cpu_time": 5.6210641054312570e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3429128441492760e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9228119695581319e+02, - "cpu_time": 2.7881697705334807e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2904602922691533e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4026496234766897e-03, - "cpu_time": 4.9595049519297082e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4041850072803645e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2365, - "real_time": 2.9601690371227439e+05, - "cpu_time": 5.9582558900633873e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4278552459761125e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2365, - "real_time": 2.9695396598066197e+05, - "cpu_time": 5.9468418731498485e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4138827904570091e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2365, - "real_time": 2.9582294794715091e+05, - "cpu_time": 5.9540224439749611e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4307583610253304e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2365, - "real_time": 2.9550740429117531e+05, - "cpu_time": 5.9495250866809685e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4354895375430077e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2365, - "real_time": 2.9733742511709151e+05, - "cpu_time": 5.9486042537000438e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4081904573023003e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9632772940967081e+05, - "cpu_time": 5.9514499095138418e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4232352784607530e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time_median", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9601690371227439e+05, - "cpu_time": 5.9495250866809697e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4278552459761125e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8038578657307460e+02, - "cpu_time": 4.6361623111641677e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1639624266787996e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6335226478052523e-03, - "cpu_time": 7.7899711526646848e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6314730133094985e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2141, - "real_time": 3.2713877553777531e+05, - "cpu_time": 6.5896225128441292e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0132353484868300e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2141, - "real_time": 3.2691787533041841e+05, - "cpu_time": 6.5921676459600206e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0186499357078290e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2141, - "real_time": 3.2756587354286230e+05, - "cpu_time": 6.5883382905184536e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0027872612223816e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2141, - "real_time": 3.2784902863791725e+05, - "cpu_time": 6.5943311583376094e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9958754518536913e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2141, - "real_time": 3.2722158501592855e+05, - "cpu_time": 6.5876265903784696e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0112074509766614e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2733862761298037e+05, - "cpu_time": 6.5904172396077367e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0083510896494794e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time_median", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2722158501592855e+05, - "cpu_time": 6.5896225128441281e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0112074509766614e+08, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6838235019902862e+02, - "cpu_time": 2.7894455194039892e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0094220076539868e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1253861265483620e-03, - "cpu_time": 4.2325780265317734e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1250033754512034e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1786, - "real_time": 3.9252218450622971e+05, - "cpu_time": 7.8975832082865830e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3356901105080826e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1786, - "real_time": 3.9497037302618712e+05, - "cpu_time": 7.9470358006719197e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3274109548597431e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1786, - "real_time": 3.9176259019132075e+05, - "cpu_time": 7.8803482530791103e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3382798999362323e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1786, - "real_time": 3.9165087614843593e+05, - "cpu_time": 7.8787540145581041e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3386616293468843e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1786, - "real_time": 3.9184285392778774e+05, - "cpu_time": 7.8797045688685961e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3380057713049948e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9254977555999230e+05, - "cpu_time": 7.8966851690928638e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3356096731911874e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time_median", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9184285392778774e+05, - "cpu_time": 7.8803482530791103e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3380057713049948e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3953021635571522e+03, - "cpu_time": 2.9209392695588913e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7278770568786999e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.5544592060119829e-03, - "cpu_time": 3.6989435529116281e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5398643419393104e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1316, - "real_time": 5.3291084793485457e+05, - "cpu_time": 1.0685649946808373e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9676386849009733e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1316, - "real_time": 5.3073955025017192e+05, - "cpu_time": 1.0682174825228236e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9756884511541266e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1316, - "real_time": 5.3305956147580000e+05, - "cpu_time": 1.0684319293313357e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9670897509031990e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1316, - "real_time": 5.3064471448978304e+05, - "cpu_time": 1.0682126641337532e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9760415422364283e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1316, - "real_time": 5.3303499810827896e+05, - "cpu_time": 1.0690030744681135e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9671803985129616e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3207793445177784e+05, - "cpu_time": 1.0684860290273728e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9707277655415380e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time_median", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3291084793485457e+05, - "cpu_time": 1.0684319293313357e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9676386849009733e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2667575791525558e+03, - "cpu_time": 3.2532442628999740e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6959026569127264e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3807745014980731e-03, - "cpu_time": 3.0447232575060951e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3828266587710735e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 903, - "real_time": 7.7229960004727903e+05, - "cpu_time": 1.5491514684385913e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7154643092805119e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 903, - "real_time": 7.7209192059226625e+05, - "cpu_time": 1.5484970199334889e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7161947225031052e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 903, - "real_time": 7.7176837959395896e+05, - "cpu_time": 1.5480220586932159e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7173334065634418e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 903, - "real_time": 7.7201201455927512e+05, - "cpu_time": 1.5479101373200519e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7164758584712162e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 903, - "real_time": 7.7195533022443333e+05, - "cpu_time": 1.5478720775193858e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7166753280792651e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7202544900344277e+05, - "cpu_time": 1.5482905523809469e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7164287249795084e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time_median", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7201201455927524e+05, - "cpu_time": 1.5480220586932159e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7164758584712162e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9413853015435285e+02, - "cpu_time": 5.4215564957094170e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8306994827762700e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5146649039219316e-04, - "cpu_time": 3.5016402363059035e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5145881502294147e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 525, - "real_time": 1.3315677662779177e+06, - "cpu_time": 2.6856290914284252e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1498990184511471e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 525, - "real_time": 1.3311700591640105e+06, - "cpu_time": 2.6858089504763228e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1508400982471538e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 525, - "real_time": 1.3320578368646759e+06, - "cpu_time": 2.6852799904762446e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1487401552115192e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 525, - "real_time": 1.3310051862416521e+06, - "cpu_time": 2.6855659676190647e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1512303959110932e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 525, - "real_time": 1.3324488457735807e+06, - "cpu_time": 2.6862295619048383e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1478161531709013e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3316499388643675e+06, - "cpu_time": 2.6857027123809797e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1497051641983628e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time_median", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3315677662779179e+06, - "cpu_time": 2.6856290914284256e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1498990184511471e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.0360911058360466e+02, - "cpu_time": 3.5059589657124815e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4275496100941640e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5327911860857604e-04, - "cpu_time": 1.3054158785148312e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5323277439445424e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 280, - "real_time": 2.5202628033834375e+06, - "cpu_time": 5.0582372500002747e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3284655825330377e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 280, - "real_time": 2.5245536817237735e+06, - "cpu_time": 5.0600333500000266e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3228083287467394e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 280, - "real_time": 2.5194228211018657e+06, - "cpu_time": 5.0556139214287605e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3295753018269696e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 280, - "real_time": 2.5246896972281062e+06, - "cpu_time": 5.0600923178572133e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3226293152817855e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 280, - "real_time": 2.5224462176473546e+06, - "cpu_time": 5.0614597000000160e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3255844827581382e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5222750442169076e+06, - "cpu_time": 5.0590873078572582e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3258126022293344e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time_median", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5224462176473541e+06, - "cpu_time": 5.0600333500000257e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3255844827581382e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4102037396678552e+03, - "cpu_time": 2.2539020009220390e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1783339261191548e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.5556737366687657e-04, - "cpu_time": 4.4551553744121155e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5565634816245431e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 144, - "real_time": 4.8487175728142671e+06, - "cpu_time": 9.7048982916668877e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4601347156341496e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 144, - "real_time": 4.8472431177894277e+06, - "cpu_time": 9.6995422083333936e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4611872341264381e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 144, - "real_time": 4.8480053665116429e+06, - "cpu_time": 9.6989988124999776e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4606430339147825e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 144, - "real_time": 4.8467242547000451e+06, - "cpu_time": 9.7008470763889756e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4615577694007502e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 144, - "real_time": 4.8510265058009988e+06, - "cpu_time": 9.7022702916665561e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4584878025171199e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8483433635232765e+06, - "cpu_time": 9.7013113361111581e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4604021111186481e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time_median", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8480053665116429e+06, - "cpu_time": 9.7008470763889756e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.4606430339147825e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6797009486704974e+03, - "cpu_time": 2.3705991582074466e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1985497252262835e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.4644843046963234e-04, - "cpu_time": 2.4435863112478136e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4636140157677427e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 72, - "real_time": 9.5066479019199815e+06, - "cpu_time": 1.9020701972222138e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5295755503076200e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 72, - "real_time": 9.5140456687659025e+06, - "cpu_time": 1.9009131847222231e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5268310840841751e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 72, - "real_time": 9.5344479195773602e+06, - "cpu_time": 1.9018272166666370e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5192842084859161e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 72, - "real_time": 9.5005234858642016e+06, - "cpu_time": 1.9007991513889682e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5318508553687100e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 72, - "real_time": 9.5156656009041592e+06, - "cpu_time": 1.9021273513888877e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5262306818360372e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5142661154063232e+06, - "cpu_time": 1.9015474202777863e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5267544760164919e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time_median", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5140456687659025e+06, - "cpu_time": 1.9018272166666370e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.5268310840841751e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2808292425399844e+04, - "cpu_time": 6.4227387339989373e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7438557306899624e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3462196947234373e-03, - "cpu_time": 3.3776379518637908e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3451051846535686e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 34, - "real_time": 2.0585481022648953e+07, - "cpu_time": 4.0865759176470228e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.2600095147722902e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 34, - "real_time": 2.0566474098493069e+07, - "cpu_time": 4.0864190941175930e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.2630223186830621e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 34, - "real_time": 2.0541881320669372e+07, - "cpu_time": 4.0801206941179156e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.2669288149608107e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 34, - "real_time": 2.0451019737212095e+07, - "cpu_time": 4.0686905000002831e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.2814434127160225e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 34, - "real_time": 2.0540573195937801e+07, - "cpu_time": 4.0818334088238075e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.2671368690563979e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0537085874992259e+07, - "cpu_time": 4.0807279229413256e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.2677081860377173e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time_median", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0541881320669372e+07, - "cpu_time": 4.0818334088238075e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.2669288149608107e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1595289940026116e+04, - "cpu_time": 7.2986102847817907e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2282617600365635e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5122984952238537e-03, - "cpu_time": 1.7885559690833460e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5180528038563324e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 19, - "real_time": 3.7531883896965727e+07, - "cpu_time": 7.4162388210526705e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5760988808465023e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 19, - "real_time": 3.7481709922614850e+07, - "cpu_time": 7.4150598736842334e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5808859381577678e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 19, - "real_time": 3.7499428971817620e+07, - "cpu_time": 7.4169512052626967e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5791939152158880e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 19, - "real_time": 3.7517315659083821e+07, - "cpu_time": 7.4247911157894313e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5774875052262101e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 19, - "real_time": 3.7420135383543216e+07, - "cpu_time": 7.4081775947368100e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5867782578634615e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7490094766805038e+07, - "cpu_time": 7.4162437221051693e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5800888994619660e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time_median", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7499428971817620e+07, - "cpu_time": 7.4162388210526690e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.5791939152158880e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3413870704274377e+04, - "cpu_time": 5.9165531145480913e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1494362217920641e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1580090947840023e-03, - "cpu_time": 7.9778299314961347e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1590316157835249e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.4951936801274613e+07, - "cpu_time": 1.4633796811110893e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5814345493395581e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.5065947241253316e+07, - "cpu_time": 1.4639460100000989e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5759950532200613e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.5083636575275004e+07, - "cpu_time": 1.4634326377778155e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5751525664434276e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.4672662549548686e+07, - "cpu_time": 1.4582424377777493e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5948290423135905e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.4863457017474711e+07, - "cpu_time": 1.4621250733332798e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5856673829174294e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4927528036965281e+07, - "cpu_time": 1.4622251680000067e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5826157188468142e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time_median", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4951936801274627e+07, - "cpu_time": 1.4633796811110896e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5814345493395581e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6821641703233420e+05, - "cpu_time": 2.3250989195529689e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0530264842380844e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2450549409470059e-03, - "cpu_time": 1.5901100394361137e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2478063839987345e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4585339426994324e+08, - "cpu_time": 2.7974162959999377e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6808941930166364e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4659825861454010e+08, - "cpu_time": 2.8008278139998311e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6621916049605203e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4629303812980652e+08, - "cpu_time": 2.7961166800000679e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6698322685979891e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4635931253433228e+08, - "cpu_time": 2.7972630680001199e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6681704956359601e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4618510007858276e+08, - "cpu_time": 2.7940168420000190e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6725419465554390e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4625782072544098e+08, - "cpu_time": 2.7971281399999952e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6707261017533092e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time_median", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4629303812980652e+08, - "cpu_time": 2.7972630680001199e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6698322685979891e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7216165212885983e+05, - "cpu_time": 2.4744723540030752e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8347470348038487e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8608348653011099e-03, - "cpu_time": 8.8464747775304970e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8619605073609976e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8482203185558319e+08, - "cpu_time": 5.0821744750004429e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7698692653959875e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8404362499713898e+08, - "cpu_time": 5.0777224800003749e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7802003970721583e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8500491380691528e+08, - "cpu_time": 5.0887548650001693e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7674502157090425e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8531563282012939e+08, - "cpu_time": 5.0925604550002390e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7633473265620728e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8529836237430573e+08, - "cpu_time": 5.0914575849998301e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7635751395981455e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8489691317081451e+08, - "cpu_time": 5.0865339720002109e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7688884688674812e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time_median", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8500491380691528e+08, - "cpu_time": 5.0887548650001687e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7674502157090425e+09, - "dst_gpu": 4.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2006241545315209e+05, - "cpu_time": 6.3667188053411467e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8906817454530578e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8254406819119880e-03, - "cpu_time": 1.2516811723637265e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8283060914040920e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2695, - "real_time": 2.5971246484134879e+05, - "cpu_time": 5.2075980853434908e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9428219227965567e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2695, - "real_time": 2.5907465601676874e+05, - "cpu_time": 5.2087298515773419e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9525286484746742e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2695, - "real_time": 2.5965831492395108e+05, - "cpu_time": 5.2017878181818296e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9436441706090169e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2695, - "real_time": 2.6025503830844277e+05, - "cpu_time": 5.2077152653061145e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9346020221379939e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2695, - "real_time": 2.5958344802529950e+05, - "cpu_time": 5.2128076994431094e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9447815636542402e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5965678442316217e+05, - "cpu_time": 5.2077277439703775e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9436756655344963e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time_median", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5965831492395108e+05, - "cpu_time": 5.2077152653061145e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9436441706090169e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1989941395670473e+02, - "cpu_time": 3.9404902206514350e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.3768956137337727e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6171324577153954e-03, - "cpu_time": 7.5666210185696087e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6169929158891660e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2693, - "real_time": 2.5899951178317695e+05, - "cpu_time": 5.2115318343855278e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.9073508127478492e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2693, - "real_time": 2.5972443150520333e+05, - "cpu_time": 5.2123505458595324e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8852805187831167e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2693, - "real_time": 2.5981331257166178e+05, - "cpu_time": 5.2157559004825738e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8825829967243122e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2693, - "real_time": 2.5899196625038749e+05, - "cpu_time": 5.2125786817678623e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.9075811873640921e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2693, - "real_time": 2.5905786163462041e+05, - "cpu_time": 5.2085157630896772e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.9055697714687930e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5931741674900995e+05, - "cpu_time": 5.2121465451170353e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8976730574176330e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time_median", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5905786163462038e+05, - "cpu_time": 5.2123505458595336e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.9055697714687930e+06, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1410268366210994e+02, - "cpu_time": 2.5892205358258428e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2604295156671173e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5968949901383396e-03, - "cpu_time": 4.9676664180740219e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5959504863059630e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2711, - "real_time": 2.5905852601717442e+05, - "cpu_time": 5.2140400295093947e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5811098993624529e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2711, - "real_time": 2.5981041581190613e+05, - "cpu_time": 5.2287093212836882e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5765341767380737e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2711, - "real_time": 2.5966016427587686e+05, - "cpu_time": 5.2145219218002661e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5774464332727566e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2711, - "real_time": 2.5895281448515083e+05, - "cpu_time": 5.2072746329771436e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5817553511220390e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2711, - "real_time": 2.5954530671215194e+05, - "cpu_time": 5.2077187458507140e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5781445065938557e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5940544546045206e+05, - "cpu_time": 5.2144529302842414e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5789980734178357e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time_median", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5954530671215191e+05, - "cpu_time": 5.2140400295093947e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5781445065938557e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7870560139313091e+02, - "cpu_time": 8.6645415830896582e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3059347057511190e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4598984254972662e-03, - "cpu_time": 1.6616396195213812e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4603784162698725e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2674, - "real_time": 2.6158245190744349e+05, - "cpu_time": 5.2471932946903165e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1317085455329396e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2674, - "real_time": 2.6229222637255344e+05, - "cpu_time": 5.2521803253550967e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1232340025069151e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2674, - "real_time": 2.6223848879442841e+05, - "cpu_time": 5.2486457778610568e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1238740116527278e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2674, - "real_time": 2.6092210349586091e+05, - "cpu_time": 5.2411389715780522e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1396343545612849e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2674, - "real_time": 2.6153512565065915e+05, - "cpu_time": 5.2474433021694410e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1322752458659481e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6171407924418911e+05, - "cpu_time": 5.2473203343307925e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1301452320239630e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time_median", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6158245190744349e+05, - "cpu_time": 5.2474433021694410e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1317085455329396e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.6697336989319820e+02, - "cpu_time": 3.9880076146029535e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7844980102851012e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1663846726571812e-03, - "cpu_time": 7.6000841582155021e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1674706786362821e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2648, - "real_time": 2.6465799119882711e+05, - "cpu_time": 5.3002514803624817e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1906311333298638e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2648, - "real_time": 2.6484560150212789e+05, - "cpu_time": 5.3039852114801726e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1862458379805736e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2648, - "real_time": 2.6404952904381126e+05, - "cpu_time": 5.2925826925980160e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.2048965053376615e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2648, - "real_time": 2.6401381872077694e+05, - "cpu_time": 5.3004322809669119e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.2057357752655528e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2648, - "real_time": 2.6396668945271045e+05, - "cpu_time": 5.2913530324777425e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.2068437627374150e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6430672598365077e+05, - "cpu_time": 5.2977209395770659e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1988706029302135e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time_median", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6404952904381126e+05, - "cpu_time": 5.3002514803624828e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.2048965053376615e+07, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1271777542042776e+02, - "cpu_time": 5.4760372107565547e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6732481314447839e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5615106800042512e-03, - "cpu_time": 1.0336590532444550e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5604855708509593e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2608, - "real_time": 2.6884231574178470e+05, - "cpu_time": 5.3849750268399506e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2188557411279228e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2608, - "real_time": 2.6809679517892771e+05, - "cpu_time": 5.3789777300606226e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2222451215103355e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2608, - "real_time": 2.6816728108527180e+05, - "cpu_time": 5.3773023734666081e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2219238628735040e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2608, - "real_time": 2.6754403111533448e+05, - "cpu_time": 5.3923887346629193e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2247703625977801e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2608, - "real_time": 2.6825372986233025e+05, - "cpu_time": 5.3888949501536658e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2215300796308321e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6818083059672976e+05, - "cpu_time": 5.3845077630367537e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2218650335480750e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time_median", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6816728108527174e+05, - "cpu_time": 5.3849750268399506e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2219238628735040e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6250297842367428e+02, - "cpu_time": 6.4045757780206327e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1069468212914155e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7245937280250710e-03, - "cpu_time": 1.1894449891940693e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7243695199077947e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2524, - "real_time": 2.7661392231250071e+05, - "cpu_time": 5.5525479041199235e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3692227582804602e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2524, - "real_time": 2.7721481615081191e+05, - "cpu_time": 5.5668834746437729e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3640872053659189e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2524, - "real_time": 2.7724403976359469e+05, - "cpu_time": 5.5669219770209561e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3638380127443820e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2524, - "real_time": 2.7666527001377603e+05, - "cpu_time": 5.5568726505542092e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3687830422928312e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2524, - "real_time": 2.7660429284204217e+05, - "cpu_time": 5.5556156339145184e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3693052384196013e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7686846821654518e+05, - "cpu_time": 5.5597683280506753e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3670472514206386e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time_median", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7666527001377603e+05, - "cpu_time": 5.5568726505542104e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3687830422928312e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3048548902841412e+02, - "cpu_time": 6.7000810282507427e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8242428571211791e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1936552080388362e-03, - "cpu_time": 1.2051007583259992e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1931501812759099e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2363, - "real_time": 2.9307047516894632e+05, - "cpu_time": 5.8980355268724496e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4723713613403374e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2363, - "real_time": 2.9273652178223530e+05, - "cpu_time": 5.8969823952605936e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4774734359077877e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2363, - "real_time": 2.9545261018065689e+05, - "cpu_time": 5.8919141303432512e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4363121354675108e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2363, - "real_time": 2.9334511026892602e+05, - "cpu_time": 5.9020382945409440e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4681842448247695e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2363, - "real_time": 2.9274093112955603e+05, - "cpu_time": 5.8879682522217021e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4774059949270475e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9346912970606412e+05, - "cpu_time": 5.8953877198477881e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4663494344934905e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time_median", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9307047516894632e+05, - "cpu_time": 5.8969823952605936e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4723713613403374e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1374850098579554e+03, - "cpu_time": 5.4976890455870989e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7232675363854563e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8759954445540816e-03, - "cpu_time": 9.3254070925279922e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8583356758356384e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2158, - "real_time": 3.2435444825496332e+05, - "cpu_time": 6.5224010519008606e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0820226579392564e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2158, - "real_time": 3.2497518409707729e+05, - "cpu_time": 6.5350165523632080e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0665851679829109e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2158, - "real_time": 3.2449584725969739e+05, - "cpu_time": 6.5244013855414989e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0785009180781126e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2158, - "real_time": 3.2489570279034291e+05, - "cpu_time": 6.5243047636702401e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0685585481308460e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2158, - "real_time": 3.2450556002250430e+05, - "cpu_time": 6.5291805282665440e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0782591207935059e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2464534848491702e+05, - "cpu_time": 6.5270608563484694e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0747852825849271e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time_median", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2450556002250430e+05, - "cpu_time": 6.5244013855414977e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0782591207935059e+08, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7293917989244534e+02, - "cpu_time": 5.1031538636665300e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7872528027177532e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.4073029589433967e-04, - "cpu_time": 7.8184560799720540e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4054901340299107e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1796, - "real_time": 3.9039695677764917e+05, - "cpu_time": 7.8455127951006102e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3429612882423377e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1796, - "real_time": 3.8910564156713273e+05, - "cpu_time": 7.8231650779517600e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3474181404525952e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1796, - "real_time": 3.9015990193014895e+05, - "cpu_time": 7.8463354342977784e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3437772498052974e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1796, - "real_time": 3.9031936251402798e+05, - "cpu_time": 7.8441200835191528e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3432282647293913e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1796, - "real_time": 3.9036007533741818e+05, - "cpu_time": 7.8441950111362070e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3430881719827971e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9006838762527535e+05, - "cpu_time": 7.8406656804011017e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3440946230424840e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time_median", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9031936251402798e+05, - "cpu_time": 7.8441950111362070e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3432282647293913e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.4572947615354883e+02, - "cpu_time": 9.8272680915027070e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8837769224194249e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3990610197251142e-03, - "cpu_time": 1.2533716513468251e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4015210611849033e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1329, - "real_time": 5.2671420705547463e+05, - "cpu_time": 1.0582871474793667e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9907873870764260e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1329, - "real_time": 5.2488725774334930e+05, - "cpu_time": 1.0583679465763541e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9977166230099556e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1329, - "real_time": 5.2766000126342045e+05, - "cpu_time": 1.0588250316027044e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9872190378071237e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1329, - "real_time": 5.2528936616330780e+05, - "cpu_time": 1.0592293890143523e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9961873731782475e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1329, - "real_time": 5.2738623237034108e+05, - "cpu_time": 1.0581609014296504e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9882506133828483e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2638741291917872e+05, - "cpu_time": 1.0585740832204856e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9920322068909204e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time_median", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2671420705547463e+05, - "cpu_time": 1.0583679465763543e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9907873870764260e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2429891418557497e+03, - "cpu_time": 4.4383116219905287e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7062356492806431e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3613580251900853e-03, - "cpu_time": 4.1927265104468777e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3625298993664046e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 895, - "real_time": 7.8247755592917849e+05, - "cpu_time": 1.5687281776536109e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.6801433269350052e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 895, - "real_time": 7.8165002782470104e+05, - "cpu_time": 1.5671544938548363e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.6829807782855010e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 895, - "real_time": 7.7163882699259161e+05, - "cpu_time": 1.5469973586592793e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7177896272709646e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 895, - "real_time": 7.7105050174228055e+05, - "cpu_time": 1.5459929608937907e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7198633491077886e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 895, - "real_time": 7.7173840508187539e+05, - "cpu_time": 1.5471505720668766e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7174389484705105e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7571106351412553e+05, - "cpu_time": 1.5552047126256791e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7036432060139542e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time_median", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7173840508187539e+05, - "cpu_time": 1.5471505720668768e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7174389484705105e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.8125441508199683e+03, - "cpu_time": 1.1648686482028925e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0203446628319636e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.4931819645422965e-03, - "cpu_time": 7.4901306480497009e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4726748645602761e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 524, - "real_time": 1.3300039028332976e+06, - "cpu_time": 2.6811680438931631e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1536027759504356e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 524, - "real_time": 1.3302460278185327e+06, - "cpu_time": 2.6833077080150810e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1530287723378730e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 524, - "real_time": 1.3303342786304767e+06, - "cpu_time": 2.6810735782440039e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1528196088563995e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 524, - "real_time": 1.3309132066939224e+06, - "cpu_time": 2.6830195152668948e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1514481777658005e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 524, - "real_time": 1.3299678585168601e+06, - "cpu_time": 2.6800184503815756e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1536882437725687e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3302930548986178e+06, - "cpu_time": 2.6817174591601440e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1529175157366161e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time_median", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3302460278185327e+06, - "cpu_time": 2.6811680438931631e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1530287723378730e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8008577809908843e+02, - "cpu_time": 1.3988666946825551e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0062771212082962e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8571582532095147e-04, - "cpu_time": 5.2163090108704063e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8564899259992722e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 281, - "real_time": 2.5180617945593554e+06, - "cpu_time": 5.0512929181494005e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3313749559779778e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 281, - "real_time": 2.5139712128668916e+06, - "cpu_time": 5.0466989288253114e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3367955675330777e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 281, - "real_time": 2.5183265230011898e+06, - "cpu_time": 5.0506667046265714e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3310247592528086e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 281, - "real_time": 2.5145593985875412e+06, - "cpu_time": 5.0485125480421390e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3360150508721266e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 281, - "real_time": 2.5193560371354381e+06, - "cpu_time": 5.0521144946621051e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3296635633675766e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5168549932300840e+06, - "cpu_time": 5.0498571188611072e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3329747794007134e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time_median", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5180617945593558e+06, - "cpu_time": 5.0506667046265723e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3313749559779778e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4219276346926072e+03, - "cpu_time": 2.2132967025895337e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2081083891913625e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.6228334218983005e-04, - "cpu_time": 4.3828897540940684e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6253605308354521e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 141, - "real_time": 4.9704282068984304e+06, - "cpu_time": 9.9027237801405508e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3754065649142647e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 141, - "real_time": 4.9638034881535154e+06, - "cpu_time": 9.9026786524825078e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3799114006104531e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 141, - "real_time": 4.9610313305512387e+06, - "cpu_time": 9.8973174751774669e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3818000496553650e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 141, - "real_time": 4.9636264741156539e+06, - "cpu_time": 9.9019840921987742e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3800319358215036e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 141, - "real_time": 4.9615793973735888e+06, - "cpu_time": 9.8994562411346436e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3814264886864491e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9640937794184862e+06, - "cpu_time": 9.9008320482267886e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3797152879376073e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time_median", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9636264741156548e+06, - "cpu_time": 9.9019840921987742e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3800319358215036e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7459419662626451e+03, - "cpu_time": 2.3749142680308478e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5484436225429825e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.5460741329940394e-04, - "cpu_time": 2.3987017014960761e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5404091925687351e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 71, - "real_time": 9.8189944139039014e+06, - "cpu_time": 1.9575133957748130e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4172982064727750e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 71, - "real_time": 9.8398508058047630e+06, - "cpu_time": 1.9572887619716939e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4100549553256884e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 71, - "real_time": 9.8059691462508384e+06, - "cpu_time": 1.9557605140844189e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4218374032748227e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 71, - "real_time": 9.8655613952539340e+06, - "cpu_time": 1.9652587464787770e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4011680284248366e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 71, - "real_time": 9.8399770590411108e+06, - "cpu_time": 1.9586509070421301e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4100112021267076e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8340705640509110e+06, - "cpu_time": 1.9588944650703669e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4120739591249661e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time_median", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8398508058047630e+06, - "cpu_time": 1.9575133957748134e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4100549553256884e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2786785168309339e+04, - "cpu_time": 3.7037373684597354e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.9039273344028154e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3171264655765158e-03, - "cpu_time": 1.8907283850672836e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3164583854535774e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 33, - "real_time": 2.1176470161387414e+07, - "cpu_time": 4.1714058121215209e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1690297527660880e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 33, - "real_time": 2.1275801132574227e+07, - "cpu_time": 4.1863763666669637e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1542344084638605e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 33, - "real_time": 2.1266123279929161e+07, - "cpu_time": 4.1801089757579267e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1556698471383801e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 33, - "real_time": 2.1034549413756892e+07, - "cpu_time": 4.1588038787880793e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1904112933415089e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 33, - "real_time": 2.1251408383250237e+07, - "cpu_time": 4.1805932787879519e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1578548955321627e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1200870474179588e+07, - "cpu_time": 4.1754576624244884e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1654400394484005e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time_median", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1251408383250237e+07, - "cpu_time": 4.1801089757579274e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1578548955321627e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0085222219092457e+05, - "cpu_time": 1.0735378122906145e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5124539616504034e+07, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.7569849697328180e-03, - "cpu_time": 2.5710662137746654e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7780212002182130e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 18, - "real_time": 3.8921650499105453e+07, - "cpu_time": 7.7133515333331272e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4484079240957360e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 18, - "real_time": 3.8965598369638123e+07, - "cpu_time": 7.7131223222232223e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4445185911627636e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 18, - "real_time": 3.8954735216167241e+07, - "cpu_time": 7.7131856111110315e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4454791504858212e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 18, - "real_time": 3.9009865373373032e+07, - "cpu_time": 7.7177267388884097e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4406098743322763e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 18, - "real_time": 3.8975216241346464e+07, - "cpu_time": 7.7067393055560589e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4436685910575266e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8965413139926061e+07, - "cpu_time": 7.7128251022223696e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4445368262268243e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time_median", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8965598369638130e+07, - "cpu_time": 7.7131856111110315e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4445185911627636e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2020786035152261e+04, - "cpu_time": 3.9229580427810826e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8305692779227290e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.2177458045073408e-04, - "cpu_time": 5.0862790103339990e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2175613753659863e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.5003192656570017e+07, - "cpu_time": 1.4612664966666165e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5789870603126388e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.4856472512086228e+07, - "cpu_time": 1.4600276299999374e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5860019446769781e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.5081573592291936e+07, - "cpu_time": 1.4645691333331949e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5752507993193984e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.4976806011464864e+07, - "cpu_time": 1.4616151733333835e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5802466159861889e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.4926462438371450e+07, - "cpu_time": 1.4617807288889000e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5826522067659831e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4968901442156911e+07, - "cpu_time": 1.4618518324444067e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5806277254122376e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time_median", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4976806011464864e+07, - "cpu_time": 1.4616151733333835e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5802466159861889e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4223981693731374e+04, - "cpu_time": 1.6669672987142456e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0227204111049031e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1234522591839675e-03, - "cpu_time": 1.1403120765849841e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1234679278594279e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4651198089122772e+08, - "cpu_time": 2.8014349720001519e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6643481900540237e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4673800468444824e+08, - "cpu_time": 2.8038944420000005e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6587039135124569e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4657911956310272e+08, - "cpu_time": 2.7999135179998124e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6626697827099142e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4671181738376617e+08, - "cpu_time": 2.8026755959999716e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6593569732400122e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4656282961368561e+08, - "cpu_time": 2.8020889760000503e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6630768757337675e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4662075042724609e+08, - "cpu_time": 2.8020015007999980e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6616311470500355e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time_median", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4657911956310272e+08, - "cpu_time": 2.8020889760000503e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6626697827099142e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8692087905188819e+04, - "cpu_time": 1.4769825391405664e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4643346380554731e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.7311132713210537e-04, - "cpu_time": 5.2711696932313348e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7301553299295176e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.8743323683738708e+08, - "cpu_time": 5.1258771699997395e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7356216553601294e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8786613047122955e+08, - "cpu_time": 5.1268710850001752e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7300040204184904e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8804598748683929e+08, - "cpu_time": 5.1264221899998575e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7276749916506262e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.8824335336685181e+08, - "cpu_time": 5.1365268850008762e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7251225794387426e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8795926272869110e+08, - "cpu_time": 5.1233986750003171e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7287976563950853e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8790959417819977e+08, - "cpu_time": 5.1278192010001928e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7294441806526146e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time_median", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8795926272869110e+08, - "cpu_time": 5.1264221899998581e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7287976563950853e+09, - "dst_gpu": 5.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0052899423514766e+05, - "cpu_time": 5.0494271666940564e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8954741279592654e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0438311202965232e-03, - "cpu_time": 9.8471240282987232e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0445186840891657e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2639, - "real_time": 2.6385958915962419e+05, - "cpu_time": 5.3108528836679109e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8808519457692406e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2639, - "real_time": 2.6512886834704585e+05, - "cpu_time": 5.3160905873443699e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8622727369681005e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2639, - "real_time": 2.6522691050562379e+05, - "cpu_time": 5.3160298560062540e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8608450328357136e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2639, - "real_time": 2.6439889389063418e+05, - "cpu_time": 5.3143040697233856e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8729360207670415e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2639, - "real_time": 2.6524206885909883e+05, - "cpu_time": 5.3174534710112063e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8606243889010171e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6477126615240535e+05, - "cpu_time": 5.3149461735506251e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8675060250482224e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time_median", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6512886834704585e+05, - "cpu_time": 5.3160298560062540e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.8622727369681005e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.1785158723717473e+02, - "cpu_time": 2.5464637505485197e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0375811318540182e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3335296016658105e-03, - "cpu_time": 4.7911374215241893e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3367982036282238e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2639, - "real_time": 2.6354165672107204e+05, - "cpu_time": 5.3050156385001331e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7710674869421795e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2639, - "real_time": 2.6503950339791767e+05, - "cpu_time": 5.3125784766952181e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7271500049757892e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2639, - "real_time": 2.6518331339770550e+05, - "cpu_time": 5.3172376847290585e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7229595397978025e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2639, - "real_time": 2.6449947103806119e+05, - "cpu_time": 5.3153768738159328e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7429266378581729e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2639, - "real_time": 2.6513923543142580e+05, - "cpu_time": 5.3141531413418858e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7242434401214216e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6468063599723647e+05, - "cpu_time": 5.3128723630164459e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7376694219390722e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time_median", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6503950339791767e+05, - "cpu_time": 5.3141531413418858e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.7271500049757892e+06, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9315913671481201e+02, - "cpu_time": 4.7112495788549995e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0312341192648437e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6188509563731337e-03, - "cpu_time": 8.8676129538713989e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6251239339659116e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2637, - "real_time": 2.6345927049563039e+05, - "cpu_time": 5.3040926772842254e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5546995147653894e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2637, - "real_time": 2.6496402565411065e+05, - "cpu_time": 5.3113913045125641e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5458702327186864e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2637, - "real_time": 2.6506346705252043e+05, - "cpu_time": 5.3158563784602028e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5452902829451056e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2637, - "real_time": 2.6441266740408115e+05, - "cpu_time": 5.3149513993177109e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5490937103026174e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2637, - "real_time": 2.6487082120546402e+05, - "cpu_time": 5.3117179863482027e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5464142034817325e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6455405036236130e+05, - "cpu_time": 5.3116019491845812e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5482735888427064e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time_median", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6487082120546402e+05, - "cpu_time": 5.3117179863482027e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5464142034817325e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6076867521731651e+02, - "cpu_time": 4.6304963262920529e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8761666576416064e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4976698497424536e-03, - "cpu_time": 8.7177020616217512e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5035411606671781e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2619, - "real_time": 2.6603076589342143e+05, - "cpu_time": 5.3490209774729167e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0793430874389622e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2619, - "real_time": 2.6684385142866959e+05, - "cpu_time": 5.3531335586103983e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0699601868809842e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2619, - "real_time": 2.6673937986769160e+05, - "cpu_time": 5.3506237075214519e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0711625722693838e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2619, - "real_time": 2.6613663710527902e+05, - "cpu_time": 5.3541250553642947e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0781181009510495e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2619, - "real_time": 2.6607823666343739e+05, - "cpu_time": 5.3444372699503752e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0787937047110200e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6636577419169981e+05, - "cpu_time": 5.3502681137838878e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0754755304502800e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time_median", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6613663710527902e+05, - "cpu_time": 5.3506237075214530e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.0781181009510495e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9228536809603037e+02, - "cpu_time": 3.8329919157929373e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5269216718911208e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4727318826393513e-03, - "cpu_time": 7.1641118431392363e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4719420223214504e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2595, - "real_time": 2.7050706065575697e+05, - "cpu_time": 5.4213145202308288e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.0567735127808809e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2595, - "real_time": 2.6910743527634785e+05, - "cpu_time": 5.4004335221575690e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.0882747379964381e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2595, - "real_time": 2.6848913310140528e+05, - "cpu_time": 5.3915428285162966e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1022953930176198e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2595, - "real_time": 2.6860197082786378e+05, - "cpu_time": 5.3943736377650057e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.0997318632854894e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2595, - "real_time": 2.6790079732940521e+05, - "cpu_time": 5.3976476107903617e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1156966173021793e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6892127943815582e+05, - "cpu_time": 5.4010624238920130e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.0925544248765223e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time_median", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6860197082786373e+05, - "cpu_time": 5.3976476107903617e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.0997318632854894e+07, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8481574996007748e+02, - "cpu_time": 1.1806422277599972e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2251699614158689e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.6620967742590151e-03, - "cpu_time": 2.1859444218554781e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6522775280107018e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2542, - "real_time": 2.7279415038996103e+05, - "cpu_time": 5.4805749685287417e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2011987776555300e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2542, - "real_time": 2.7218926347624353e+05, - "cpu_time": 5.4790118174668774e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2038682048478363e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2542, - "real_time": 2.7281416144874535e+05, - "cpu_time": 5.4848537883556401e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2011106691085848e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2542, - "real_time": 2.7293268969492440e+05, - "cpu_time": 5.4846630448467552e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2005890550020608e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2542, - "real_time": 2.7226561910427379e+05, - "cpu_time": 5.4741282848150691e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2035305856025225e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7259917682282964e+05, - "cpu_time": 5.4806463808026176e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2020594584433070e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time_median", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7279415038996103e+05, - "cpu_time": 5.4805749685287417e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2011987776555300e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4451183595214894e+02, - "cpu_time": 4.4440505361379337e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5197728098304695e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2638036547559259e-03, - "cpu_time": 8.1086248361221969e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2643075175321262e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2494, - "real_time": 2.8147929144161363e+05, - "cpu_time": 5.6608992742582969e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3282707464678243e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2494, - "real_time": 2.8097279158705781e+05, - "cpu_time": 5.6514041539697454e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3324678389613408e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2494, - "real_time": 2.8098504331943882e+05, - "cpu_time": 5.6611007377707725e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3323661368514609e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2494, - "real_time": 2.8091998255832912e+05, - "cpu_time": 5.6550604891742265e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3329063103010961e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2494, - "real_time": 2.8148191957351763e+05, - "cpu_time": 5.6538049679231178e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3282490079396826e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8116780569599144e+05, - "cpu_time": 5.6564539246192318e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3308520081042811e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time_median", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8098504331943882e+05, - "cpu_time": 5.6550604891742265e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3323661368514609e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8659195481233667e+02, - "cpu_time": 4.3535279774059381e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3749828538328441e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0192915013968920e-03, - "cpu_time": 7.6965675587978885e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0189333538015806e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2343, - "real_time": 3.0026150435269694e+05, - "cpu_time": 5.9903848826283659e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.3652615503464127e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2343, - "real_time": 2.9801868802696507e+05, - "cpu_time": 5.9938487622700376e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.3981134494538957e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2343, - "real_time": 2.9821488688536134e+05, - "cpu_time": 5.9934866709350259e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.3952198821779883e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2343, - "real_time": 3.0097027673043002e+05, - "cpu_time": 5.9957032735806797e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.3549815424928898e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2343, - "real_time": 2.9771719526130240e+05, - "cpu_time": 5.9851272385836754e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4025673386100477e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9903651025135128e+05, - "cpu_time": 5.9917101655995590e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.3832287526162475e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time_median", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9821488688536140e+05, - "cpu_time": 5.9934866709350259e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.3952198821779883e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4740829711027591e+03, - "cpu_time": 4.1462567843659889e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1564134190085167e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.9294414580471728e-03, - "cpu_time": 6.9199889009502772e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9196917174842945e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2128, - "real_time": 3.3005868603400554e+05, - "cpu_time": 6.6368573402253608e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9423451371612024e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2128, - "real_time": 3.3020341712622589e+05, - "cpu_time": 6.6412165977451985e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9388639367045367e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2128, - "real_time": 3.3051726010094548e+05, - "cpu_time": 6.6339308740598219e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9313255809980047e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2128, - "real_time": 3.3070093888823991e+05, - "cpu_time": 6.6404461372185429e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9269203432346869e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2128, - "real_time": 3.3013552409895218e+05, - "cpu_time": 6.6356103712403495e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9404965798660016e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3032316524967377e+05, - "cpu_time": 6.6376122640978545e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9359903155928862e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time_median", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3020341712622589e+05, - "cpu_time": 6.6368573402253608e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 7.9388639367045367e+08, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7380823735630781e+02, - "cpu_time": 3.1285849660603577e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5759413890332077e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.2891018905486289e-04, - "cpu_time": 4.7134192863035161e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2862265798290969e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1776, - "real_time": 3.9381688517866540e+05, - "cpu_time": 7.9096335529278149e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3312989354484966e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1776, - "real_time": 3.9383939645074302e+05, - "cpu_time": 7.9094722184692300e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3312228403883712e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1776, - "real_time": 3.9531859430746146e+05, - "cpu_time": 7.9396081418914499e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3262416884752753e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1776, - "real_time": 3.9561318329573178e+05, - "cpu_time": 7.9437828885131225e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3252541172473521e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1776, - "real_time": 3.9511408842601895e+05, - "cpu_time": 7.9358621283785324e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3269281338171456e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9474042953172408e+05, - "cpu_time": 7.9276717860360304e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3281891430753284e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time_median", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9511408842601895e+05, - "cpu_time": 7.9358621283785324e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3269281338171456e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5152648151398296e+02, - "cpu_time": 1.6775935406683275e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8666717796357502e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1571808150589963e-03, - "cpu_time": 2.1161238582344901e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1583309836415120e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1287, - "real_time": 5.3217787006667291e+05, - "cpu_time": 1.0708487466977453e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9703487480015490e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1287, - "real_time": 5.3527035476189759e+05, - "cpu_time": 1.0717920497280622e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9589652045393662e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1287, - "real_time": 5.3228813799014187e+05, - "cpu_time": 1.0712819564879823e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9699405738390131e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1287, - "real_time": 5.3426720768758887e+05, - "cpu_time": 1.0697644560995270e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9626433831461194e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1287, - "real_time": 5.3251626819557429e+05, - "cpu_time": 1.0710318065268190e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9690966504236362e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3330396774037520e+05, - "cpu_time": 1.0709438031080272e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9661989119899368e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time_median", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3251626819557440e+05, - "cpu_time": 1.0710318065268188e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9690966504236362e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3887931577109212e+03, - "cpu_time": 7.4858361704990023e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1133738664017124e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6041305554040397e-03, - "cpu_time": 6.9899430285455413e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6006391495897048e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 897, - "real_time": 7.7674062917405611e+05, - "cpu_time": 1.5567717179488102e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.6999385911227508e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 897, - "real_time": 7.7590673188279185e+05, - "cpu_time": 1.5550498171683028e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7028403206544094e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 897, - "real_time": 7.7600055302824476e+05, - "cpu_time": 1.5547416945373151e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7025135379300022e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 897, - "real_time": 7.7750103186334227e+05, - "cpu_time": 1.5577271950946124e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.6972980279833336e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 897, - "real_time": 7.7529956271026772e+05, - "cpu_time": 1.5532882931994139e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7049570267637482e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7628970173174073e+05, - "cpu_time": 1.5555157435896914e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7015095008908491e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time_median", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7600055302824487e+05, - "cpu_time": 1.5550498171683028e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7025135379300022e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4872027282453382e+02, - "cpu_time": 1.7496973990851579e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9524933447918217e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0933035320850137e-03, - "cpu_time": 1.1248342591810420e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0929050383936122e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 523, - "real_time": 1.3354436123127521e+06, - "cpu_time": 2.6936935659655780e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1407570947426286e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 523, - "real_time": 1.3347763742229424e+06, - "cpu_time": 2.6923975334609672e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1423271201078682e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 523, - "real_time": 1.3342988221010419e+06, - "cpu_time": 2.6925248527721600e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1434517744649405e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 523, - "real_time": 1.3367401330908102e+06, - "cpu_time": 2.6954048948372100e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1377108356146469e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 523, - "real_time": 1.3364446180272512e+06, - "cpu_time": 2.6954723135757023e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1384046472432833e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3355407119509596e+06, - "cpu_time": 2.6938986321223234e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1405302944346733e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time_median", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3354436123127523e+06, - "cpu_time": 2.6936935659655780e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1407570947426286e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0478058225532400e+03, - "cpu_time": 1.4939812340906367e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4638785720729013e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.8455550862437139e-04, - "cpu_time": 5.5457960306161901e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8454220818666674e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 279, - "real_time": 2.5409345822175131e+06, - "cpu_time": 5.0810024301074836e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3013868435287032e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 279, - "real_time": 2.5305328256447255e+06, - "cpu_time": 5.0798006881716093e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3149571959663329e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 279, - "real_time": 2.5400881234916947e+06, - "cpu_time": 5.0789491541214427e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3024869973679194e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 279, - "real_time": 2.5307025399900251e+06, - "cpu_time": 5.0797057060932005e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3147348878201480e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 279, - "real_time": 2.5395886491863960e+06, - "cpu_time": 5.0801767311833734e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3031365149184480e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5363693441060707e+06, - "cpu_time": 5.0799269419354219e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3073404879203105e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time_median", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5395886491863960e+06, - "cpu_time": 5.0798006881716093e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3031365149184480e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2728612009700464e+03, - "cpu_time": 7.4833545843445245e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8805347250806028e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0789011715596321e-03, - "cpu_time": 1.4731224818547117e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0803829391654663e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 138, - "real_time": 4.9885865503355209e+06, - "cpu_time": 9.9454549710136913e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3631201605335689e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 138, - "real_time": 4.9886131706391126e+06, - "cpu_time": 9.9449984782600906e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3631022142072802e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 138, - "real_time": 4.9842607324430048e+06, - "cpu_time": 9.9417822173899878e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3660389976783481e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 138, - "real_time": 5.0010040058227982e+06, - "cpu_time": 9.9540227028973140e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3547695583658509e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 138, - "real_time": 4.9838815862987787e+06, - "cpu_time": 9.9392164637674149e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3662950673070474e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9892692091078442e+06, - "cpu_time": 9.9450949666657001e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3626651996184192e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time_median", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9885865503355209e+06, - "cpu_time": 9.9449984782600906e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3631201605335689e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9410586626929125e+03, - "cpu_time": 5.5985375651142622e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6716585590301864e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3911974623502185e-03, - "cpu_time": 5.6294460574581007e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3892725804401538e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 70, - "real_time": 9.8329917394689154e+06, - "cpu_time": 1.9685467671427302e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4124336609899654e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 70, - "real_time": 9.8590901653681491e+06, - "cpu_time": 1.9698816571430404e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4034004595947466e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 70, - "real_time": 9.8606535632695463e+06, - "cpu_time": 1.9673393600000314e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4028608534619470e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 70, - "real_time": 9.8279013564544059e+06, - "cpu_time": 1.9650849628568985e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4142011384722900e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 70, - "real_time": 9.7911856403308250e+06, - "cpu_time": 1.9577250071428612e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4270039638290691e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8343644929783680e+06, - "cpu_time": 1.9657155508571122e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4119800152696037e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time_median", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8329917394689135e+06, - "cpu_time": 1.9673393600000314e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4124336609899654e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8330831234265272e+04, - "cpu_time": 4.8024840825204476e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.8441111926755477e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8807993901886777e-03, - "cpu_time": 2.4431225974818269e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8851608592724122e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 33, - "real_time": 2.1237892014059152e+07, - "cpu_time": 4.1848060272727571e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1598646398416085e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 33, - "real_time": 2.1206037564711139e+07, - "cpu_time": 4.1794807999994271e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1646112007117977e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 33, - "real_time": 2.1229746497490190e+07, - "cpu_time": 4.1839042151512772e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1610770297202420e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 33, - "real_time": 2.1267016954494245e+07, - "cpu_time": 4.1937105424239866e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1555372407703018e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 33, - "real_time": 2.1183040783260807e+07, - "cpu_time": 4.1784233636366427e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1680467732012558e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1224746762803108e+07, - "cpu_time": 4.1840649896968186e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1618273768490410e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time_median", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1229746497490190e+07, - "cpu_time": 4.1839042151512772e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1610770297202420e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1913895508731290e+04, - "cpu_time": 6.0509175404585534e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7542542938467227e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5036172570341889e-03, - "cpu_time": 1.4461815376574753e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5036413210466394e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 18, - "real_time": 3.8912937045097351e+07, - "cpu_time": 7.7123279999998167e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4491800977256255e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 18, - "real_time": 3.8975808148582779e+07, - "cpu_time": 7.7178906555546850e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4436162936849937e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 18, - "real_time": 3.9082289362947144e+07, - "cpu_time": 7.7203045666667297e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4342340274274764e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 18, - "real_time": 3.8940564211871892e+07, - "cpu_time": 7.7114707277777001e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4467330075068808e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 18, - "real_time": 3.9091258827182978e+07, - "cpu_time": 7.7203791611118004e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4334460446351423e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9000571519136436e+07, - "cpu_time": 7.7164746222221464e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4414418941960244e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time_median", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8975808148582779e+07, - "cpu_time": 7.7178906555546850e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4436162936849937e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.1847260677182509e+04, - "cpu_time": 4.3055918356691036e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2196024925033096e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0986169558315951e-03, - "cpu_time": 5.5797395137796796e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0978423330869351e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.4816804793145925e+07, - "cpu_time": 1.4610083588887492e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5879032356724191e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.4940841231081218e+07, - "cpu_time": 1.4628298288888195e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5819648083783207e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.4950728151533335e+07, - "cpu_time": 1.4636900966666469e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5814923032806902e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.5042728748586446e+07, - "cpu_time": 1.4627699611110580e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5771014790697684e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.4951954185962677e+07, - "cpu_time": 1.4632618488889825e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5814337186457739e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4940611422061935e+07, - "cpu_time": 1.4627120188888514e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5819791090093942e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time_median", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4950728151533335e+07, - "cpu_time": 1.4628298288888195e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5814923032806902e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0602557431756257e+04, - "cpu_time": 1.0220864762618019e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8542569172280147e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0755524394884706e-03, - "cpu_time": 6.9876124832708318e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0760132317728451e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4679051637649536e+08, - "cpu_time": 2.8034769779997075e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6573950773700376e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4679080545902252e+08, - "cpu_time": 2.8051083999998808e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6573878746776857e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4657138288021088e+08, - "cpu_time": 2.8021017599999142e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6628631145465221e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4669031500816345e+08, - "cpu_time": 2.8021202340000856e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6598933744884429e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4647422432899475e+08, - "cpu_time": 2.8019367699998838e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6652927466209884e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4666344881057739e+08, - "cpu_time": 2.8029488283998948e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6605664375407357e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time_median", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4669031500816345e+08, - "cpu_time": 2.8021202340000856e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6598933744884429e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3907706024542107e+05, - "cpu_time": 1.3574836323256436e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4722659695363198e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.4827348854345777e-04, - "cpu_time": 4.8430553514620657e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4855974581602707e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.9247023165225983e+08, - "cpu_time": 5.2006779250007182e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6712858533809814e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.9323415458202362e+08, - "cpu_time": 5.2121152649999660e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6617215533112545e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.9262797534465790e+08, - "cpu_time": 5.2065230300001985e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6693068143445425e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.9285678267478943e+08, - "cpu_time": 5.2048018050004429e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6664400059067950e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.9310245811939240e+08, - "cpu_time": 5.2108363150000513e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6633668338687963e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9285832047462463e+08, - "cpu_time": 5.2069908680002755e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6664242121624742e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time_median", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9285678267478943e+08, - "cpu_time": 5.2065230300001985e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.6664400059067950e+09, - "dst_gpu": 6.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1801283138721698e+05, - "cpu_time": 4.6344100431813736e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9814495608308287e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0858931065090632e-03, - "cpu_time": 8.9003613808164809e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0859216856640142e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2672, - "real_time": 2.6074612651427742e+05, - "cpu_time": 5.2164063248500240e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9271916085163006e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2672, - "real_time": 2.5941018859026633e+05, - "cpu_time": 5.2117437013478793e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9474162736814837e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2672, - "real_time": 2.6070695572114803e+05, - "cpu_time": 5.2164031399702787e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9277816626237989e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2672, - "real_time": 2.6062971233612648e+05, - "cpu_time": 5.2151687799397751e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9289457476719976e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2672, - "real_time": 2.5998611624187423e+05, - "cpu_time": 5.2153430613769620e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9386718598747668e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6029581988073853e+05, - "cpu_time": 5.2150130014969839e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9340014304736699e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time_median", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6062971233612642e+05, - "cpu_time": 5.2153430613769620e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 3.9289457476719976e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.8385615560296708e+02, - "cpu_time": 1.9167266922531070e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8372796275675428e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2430485279036610e-03, - "cpu_time": 3.6754015602701381e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2463844469175747e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2669, - "real_time": 2.6074989167172581e+05, - "cpu_time": 5.2204604608464456e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8542698018772490e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2669, - "real_time": 2.6024627786634976e+05, - "cpu_time": 5.2208974334958068e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8694689383867234e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2669, - "real_time": 2.6074054388995163e+05, - "cpu_time": 5.2164775608838937e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8545513844765946e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2669, - "real_time": 2.6047137776278405e+05, - "cpu_time": 5.2180383626827440e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8626681272640647e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2669, - "real_time": 2.6017787637345702e+05, - "cpu_time": 5.2174259910078469e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8715378438261934e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6047719351285364e+05, - "cpu_time": 5.2186599617833475e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8624992191661661e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time_median", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6047137776278408e+05, - "cpu_time": 5.2180383626827446e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 7.8626681272640647e+06, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6770520898289612e+02, - "cpu_time": 1.9313220552122445e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0807431093445084e+03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0277491298664725e-03, - "cpu_time": 3.7008007215558512e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0277575722546764e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2648, - "real_time": 2.6007377119142961e+05, - "cpu_time": 5.2110330060424557e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5749377498683261e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2648, - "real_time": 2.6021238637217984e+05, - "cpu_time": 5.2186180249244958e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5740987802715594e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2648, - "real_time": 2.6041721631727094e+05, - "cpu_time": 5.2128412160120998e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5728606802285185e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2648, - "real_time": 2.5970870288675564e+05, - "cpu_time": 5.2065303436561103e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5771516142784152e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2648, - "real_time": 2.5971327751871056e+05, - "cpu_time": 5.2121220468272851e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5771238340731006e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6002507085726931e+05, - "cpu_time": 5.2122289274924889e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5752345317439839e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time_median", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6007377119142958e+05, - "cpu_time": 5.2121220468272845e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 1.5749377498683261e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1166515093405053e+02, - "cpu_time": 4.3333293363824339e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8879784586049307e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1985965426584847e-03, - "cpu_time": 8.3137740046792630e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1985380085051207e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2652, - "real_time": 2.6189907699383353e+05, - "cpu_time": 5.2547311236808391e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1279224402126785e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2652, - "real_time": 2.6183952254548369e+05, - "cpu_time": 5.2479933634986030e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1286338748104699e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2652, - "real_time": 2.6247730019874941e+05, - "cpu_time": 5.2554378846153698e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1210317973390337e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2652, - "real_time": 2.6265039529623662e+05, - "cpu_time": 5.2559302450979024e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1189749365351059e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2652, - "real_time": 2.6124935364482368e+05, - "cpu_time": 5.2456778846154630e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1357015379020877e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6202312973582541e+05, - "cpu_time": 5.2519541003016359e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1264529173598751e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time_median", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6189907699383359e+05, - "cpu_time": 5.2547311236808391e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 3.1279224402126785e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.5847180207656379e+02, - "cpu_time": 4.7627895915995020e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6663669689016140e+04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1313836020492587e-03, - "cpu_time": 9.0686047528975178e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1322460772993219e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2626, - "real_time": 2.6467991815725667e+05, - "cpu_time": 5.3118429245996103e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1901182810044646e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2626, - "real_time": 2.6467248313712358e+05, - "cpu_time": 5.3046194211728126e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1902921700823925e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2626, - "real_time": 2.6571225209224771e+05, - "cpu_time": 5.3159506016755197e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1660686968668438e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2626, - "real_time": 2.6480878907621477e+05, - "cpu_time": 5.3042907463825797e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1871058196956262e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2626, - "real_time": 2.6478935076528130e+05, - "cpu_time": 5.3118562147753674e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1875600180474624e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6493255864562478e+05, - "cpu_time": 5.3097119817211793e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1842289971393585e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time_median", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6478935076528130e+05, - "cpu_time": 5.3118429245996103e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 6.1875600180474624e+07, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4023168912831397e+02, - "cpu_time": 5.0838714916919014e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0254438609999574e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6616745460763477e-03, - "cpu_time": 9.5746652722280613e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6581595886476673e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2565, - "real_time": 2.6920745269527938e+05, - "cpu_time": 5.3951954346976650e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2172025578017958e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2565, - "real_time": 2.6847606952135137e+05, - "cpu_time": 5.3938438791422790e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2205184640262333e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2565, - "real_time": 2.6983435579564708e+05, - "cpu_time": 5.4018636218329426e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2143746448957042e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2565, - "real_time": 2.7013246424325521e+05, - "cpu_time": 5.4028404951262311e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2130345048232448e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2565, - "real_time": 2.6930158308364055e+05, - "cpu_time": 5.3933168849903136e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2167771026367418e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6939038506783475e+05, - "cpu_time": 5.3974120631578867e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2163814548367441e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time_median", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6930158308364055e+05, - "cpu_time": 5.3951954346976650e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.2167771026367418e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3739988892375470e+02, - "cpu_time": 4.5743882478586409e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8798851030466479e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3660825488008869e-03, - "cpu_time": 8.4751510433729680e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3675838624431923e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2514, - "real_time": 2.7910660571317200e+05, - "cpu_time": 5.5885070167069428e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3480633800315365e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2514, - "real_time": 2.7831620334152301e+05, - "cpu_time": 5.5786889896585280e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3547317480319497e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2514, - "real_time": 2.7713611401641974e+05, - "cpu_time": 5.5711814558476675e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3647585675577858e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2514, - "real_time": 2.7777866736649373e+05, - "cpu_time": 5.5760661336510524e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3592884443330404e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2514, - "real_time": 2.7720739968151058e+05, - "cpu_time": 5.5713017223549879e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3641504546882835e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7790899802382378e+05, - "cpu_time": 5.5771490636438353e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3581985189285195e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time_median", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7777866736649373e+05, - "cpu_time": 5.5760661336510524e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 2.3592884443330404e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2259594446927872e+02, - "cpu_time": 7.1125057157391279e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9711415061666910e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9599471421172248e-03, - "cpu_time": 1.2752941753169072e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9561300502105848e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2379, - "real_time": 2.9682781763451931e+05, - "cpu_time": 5.9199157124833984e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4157586389489770e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2379, - "real_time": 2.9454508621833619e+05, - "cpu_time": 5.9213881504830217e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4499808733132559e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2379, - "real_time": 2.9399366619446309e+05, - "cpu_time": 5.9166597604037262e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4583273407428437e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2379, - "real_time": 2.9689218232759711e+05, - "cpu_time": 5.9193506052963703e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4148013252626634e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2379, - "real_time": 2.9466366805670573e+05, - "cpu_time": 5.9262350189155573e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4481900623994213e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9538448408632429e+05, - "cpu_time": 5.9207098495164153e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4374116481334329e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time_median", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9466366805670568e+05, - "cpu_time": 5.9199157124833984e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 4.4481900623994213e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3706663211512023e+03, - "cpu_time": 3.5308996497760955e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0565172866280507e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6402786706651574e-03, - "cpu_time": 5.9636424339633667e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6344974271050800e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2138, - "real_time": 3.2672788440885843e+05, - "cpu_time": 6.5706769644525507e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0233127476796591e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2138, - "real_time": 3.2617162131827226e+05, - "cpu_time": 6.5661395135636011e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0369959514106429e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2138, - "real_time": 3.2654588425850408e+05, - "cpu_time": 6.5623247053323919e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0277845361688423e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2138, - "real_time": 3.2589764568562224e+05, - "cpu_time": 6.5654538821333891e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0437524931639934e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2138, - "real_time": 3.2606685747946997e+05, - "cpu_time": 6.5658078811966674e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0395782026545048e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2628197863014543e+05, - "cpu_time": 6.5660805893357203e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0342847862155294e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time_median", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2617162131827226e+05, - "cpu_time": 6.5658078811966663e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 8.0369959514106429e+08, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4447271372725857e+02, - "cpu_time": 2.9876383891480765e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4800800326412020e+05, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0557515777410834e-03, - "cpu_time": 4.5501092295462234e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0554866124724040e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1797, - "real_time": 3.9041892435058590e+05, - "cpu_time": 7.8473760990544606e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3428857242821643e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1797, - "real_time": 3.8946915825589991e+05, - "cpu_time": 7.8348276794665877e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3461605081846242e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1797, - "real_time": 3.8952372623744857e+05, - "cpu_time": 7.8304161602675170e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3459719259319286e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1797, - "real_time": 3.8901204031137528e+05, - "cpu_time": 7.8174400278246868e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3477423464331498e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1797, - "real_time": 3.9064961600036535e+05, - "cpu_time": 7.8486670728984708e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3420927053964124e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8981469303113502e+05, - "cpu_time": 7.8357454079023446e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3449706420456560e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time_median", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8952372623744851e+05, - "cpu_time": 7.8348276794665889e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 1.3459719259319286e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9110404359000029e+02, - "cpu_time": 1.2909032192293112e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3838046007842170e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7729040386243239e-03, - "cpu_time": 1.6474542650753250e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7723841147629280e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1295, - "real_time": 5.3498541314198019e+05, - "cpu_time": 1.0740108741311433e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9600085801250019e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1295, - "real_time": 5.3163317052834458e+05, - "cpu_time": 1.0722644038610815e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9723675235649996e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1295, - "real_time": 5.3370614261024818e+05, - "cpu_time": 1.0713848231660654e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9647066358869846e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1295, - "real_time": 5.3147824942296126e+05, - "cpu_time": 1.0722930169884204e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9729424508688061e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1295, - "real_time": 5.3457546364300267e+05, - "cpu_time": 1.0724755783783789e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9615116504865520e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3327568786930735e+05, - "cpu_time": 1.0724857393050180e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9663073681864691e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time_median", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3370614261024818e+05, - "cpu_time": 1.0722930169884204e+06, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 1.9647066358869846e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6375680930361405e+03, - "cpu_time": 9.5187802484191275e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0412289437961215e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0707720795954746e-03, - "cpu_time": 8.8754375928461269e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0723726318372920e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 905, - "real_time": 7.7113747829571366e+05, - "cpu_time": 1.5461622961324968e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7195565758714037e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 905, - "real_time": 7.7056270735904330e+05, - "cpu_time": 1.5449272453038774e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7215851221084766e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 905, - "real_time": 7.7026728347705374e+05, - "cpu_time": 1.5448210187846271e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7226289432069254e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 905, - "real_time": 7.7188320731929399e+05, - "cpu_time": 1.5481394331491375e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7169291676694045e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 905, - "real_time": 7.7176845705815847e+05, - "cpu_time": 1.5466160011049735e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7173331338183517e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7112382670185273e+05, - "cpu_time": 1.5461331988950227e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7196065885349126e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time_median", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7113747829571366e+05, - "cpu_time": 1.5461622961324968e+06, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 2.7195565758714037e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1430294652835028e+02, - "cpu_time": 1.3633654324037973e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5193701081976821e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.2631419467800779e-04, - "cpu_time": 8.8179041325686289e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2637299777792470e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 523, - "real_time": 1.3314050715327633e+06, - "cpu_time": 2.6861300305928695e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1502839291211052e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 523, - "real_time": 1.3317131814876318e+06, - "cpu_time": 2.6870734053539154e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1495550680925317e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 523, - "real_time": 1.3307146107008676e+06, - "cpu_time": 2.6850540210323199e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1519185002341876e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 523, - "real_time": 1.3314166972609540e+06, - "cpu_time": 2.6874253613766693e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1502564213207612e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 523, - "real_time": 1.3302327819296781e+06, - "cpu_time": 2.6843989980880450e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1530601688492513e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3310964685823792e+06, - "cpu_time": 2.6860163632887644e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1510148175235672e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time_median", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3314050715327633e+06, - "cpu_time": 2.6861300305928690e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 3.1502839291211052e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.0619449645138877e+02, - "cpu_time": 1.2901072242230334e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4352992331357249e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5540989008631909e-04, - "cpu_time": 4.8030505020580868e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5550380314103047e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 280, - "real_time": 2.5296478906446802e+06, - "cpu_time": 5.0631762107140534e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3161168520817990e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 280, - "real_time": 2.5252101302612573e+06, - "cpu_time": 5.0613376178570697e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3219445381886368e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 280, - "real_time": 2.5299513413171684e+06, - "cpu_time": 5.0649473464285880e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3157191061361046e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 280, - "real_time": 2.5258678518834389e+06, - "cpu_time": 5.0622851785712037e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3210795227252088e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 280, - "real_time": 2.5290987429408622e+06, - "cpu_time": 5.0620113785717934e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3168368864260473e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5279551914094812e+06, - "cpu_time": 5.0627515464285417e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3183393811115594e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time_median", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5290987429408622e+06, - "cpu_time": 5.0622851785712037e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 3.3168368864260473e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2388558609391102e+03, - "cpu_time": 1.3934147598853076e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9397491441277773e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.8563906059221660e-04, - "cpu_time": 2.7522874608932284e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.8590972968624929e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 140, - "real_time": 4.9713958320873128e+06, - "cpu_time": 9.9145469928560350e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3747495807341180e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 140, - "real_time": 4.9734358542731833e+06, - "cpu_time": 9.9153800500013325e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3733653135558171e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 140, - "real_time": 4.9748118235064400e+06, - "cpu_time": 9.9156342500009481e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3724322839159708e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 140, - "real_time": 4.9714861404416813e+06, - "cpu_time": 9.9149746500009820e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3746882775196600e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 140, - "real_time": 4.9765147401818205e+06, - "cpu_time": 9.9150333357134257e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3712782692143764e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9735288780980874e+06, - "cpu_time": 9.9151138557145465e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3733027449879889e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time_median", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.9734358542731823e+06, - "cpu_time": 9.9150333357134257e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 3.3733653135558171e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1961692306736882e+03, - "cpu_time": 4.1498939189568927e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4893919502400972e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.4157162539961337e-04, - "cpu_time": 4.1854223555538037e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4152335643547476e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 70, - "real_time": 9.8395475053361487e+06, - "cpu_time": 1.9560429657141346e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4101600690278573e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 70, - "real_time": 9.8343155213764738e+06, - "cpu_time": 1.9576299414286170e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4119743186055017e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 70, - "real_time": 9.8598243003445007e+06, - "cpu_time": 1.9596857828573126e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4031470519031067e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 70, - "real_time": 9.8684185450630523e+06, - "cpu_time": 1.9644872542858139e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4001833066541877e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 70, - "real_time": 9.8492893390357494e+06, - "cpu_time": 1.9563037842856701e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4067871137680473e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8502790422311835e+06, - "cpu_time": 1.9588299457143094e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4064503719917402e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time_median", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8492893390357494e+06, - "cpu_time": 1.9576299414286170e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 3.4067871137680473e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4063542495994683e+04, - "cpu_time": 3.4758580543980948e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8625421557370583e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4277303653734009e-03, - "cpu_time": 1.7744562574218679e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4274513422292854e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 33, - "real_time": 2.1189572910467785e+07, - "cpu_time": 4.1787637272729188e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1670701567962136e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 33, - "real_time": 2.1246780556711283e+07, - "cpu_time": 4.1839827848482884e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1585427176072621e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 33, - "real_time": 2.1291658395167552e+07, - "cpu_time": 4.1877974545451999e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1518852479443932e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 33, - "real_time": 2.1257825647339676e+07, - "cpu_time": 4.1836814303031027e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1569016094737978e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 33, - "real_time": 2.1261267984906834e+07, - "cpu_time": 4.1845346090908743e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1563904865711646e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1249421098918628e+07, - "cpu_time": 4.1837520012120768e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1581580436785665e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time_median", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1257825647339676e+07, - "cpu_time": 4.1839827848482884e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 3.1569016094737978e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7362255218318918e+04, - "cpu_time": 3.2372552417033487e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5593296721673198e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7582716745267130e-03, - "cpu_time": 7.7376843578813505e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7603076208598831e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 18, - "real_time": 3.8993898986114398e+07, - "cpu_time": 7.7111083833326831e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4420186616320291e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 18, - "real_time": 3.8986174596680537e+07, - "cpu_time": 7.7175363222219557e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4427006339685330e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 18, - "real_time": 3.8956317636701792e+07, - "cpu_time": 7.7098065500005454e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4453391938038278e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 18, - "real_time": 3.8946494667066470e+07, - "cpu_time": 7.7161196166672289e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4462081670599179e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 18, - "real_time": 3.8915330751074687e+07, - "cpu_time": 7.7116932000005066e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4489679365321455e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8959643327527583e+07, - "cpu_time": 7.7132528144445866e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4450469185992908e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time_median", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8956317636701800e+07, - "cpu_time": 7.7116932000005066e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 3.4453391938038278e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1721090423932095e+04, - "cpu_time": 3.3717471161264635e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8055167184673841e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.1420382002108922e-04, - "cpu_time": 4.3713686005626614e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1436241211137672e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.4908275571134359e+07, - "cpu_time": 1.4603226711109427e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5835220334913259e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.4845557411511734e+07, - "cpu_time": 1.4599499955554369e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5865249092087445e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.4889982740084335e+07, - "cpu_time": 1.4624674155556428e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5843973543383102e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.4806640545527145e+07, - "cpu_time": 1.4599850066666576e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5883907370045691e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.4733859135044947e+07, - "cpu_time": 1.4597555855556896e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5918853797571731e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4836863080660507e+07, - "cpu_time": 1.4604961348888740e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5869440827600245e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time_median", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4845557411511749e+07, - "cpu_time": 1.4599850066666576e+08, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 3.5865249092087445e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9857440254834917e+04, - "cpu_time": 1.1207107895081797e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3496707989651761e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.3346296703459241e-04, - "cpu_time": 7.6734937035177590e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3385085512337420e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4673151671886444e+08, - "cpu_time": 2.8030292200000989e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6588656888801689e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4641747176647186e+08, - "cpu_time": 2.7990454900000256e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6667134428893895e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4675283133983612e+08, - "cpu_time": 2.8033453339999139e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6583342692500825e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4661936163902283e+08, - "cpu_time": 2.8029780239999127e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6616645032310076e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4651193618774414e+08, - "cpu_time": 2.8015225340000141e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6643493081139812e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4660662353038791e+08, - "cpu_time": 2.8019841203999931e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6619854424729266e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time_median", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4661936163902283e+08, - "cpu_time": 2.8029780239999127e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 3.6616645032310076e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4307460826912886e+05, - "cpu_time": 1.7875675256322889e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5745202146302098e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.7590821494823569e-04, - "cpu_time": 6.3796490230540886e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7611535348331375e-04, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2, - "real_time": 2.9009360074996948e+08, - "cpu_time": 5.1590798749998611e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7013633572891316e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2, - "real_time": 2.8925877809524536e+08, - "cpu_time": 5.1534569300008571e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7120457711621976e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2, - "real_time": 2.8987127542495728e+08, - "cpu_time": 5.1638824250005656e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7042022270950174e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2, - "real_time": 2.9001134634017944e+08, - "cpu_time": 5.1633901549996608e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7024131557270699e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2, - "real_time": 2.8941406309604645e+08, - "cpu_time": 5.1551887800007987e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7100540744755120e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8972981274127960e+08, - "cpu_time": 5.1589996330003488e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7060157171497860e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time_median", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8987127542495728e+08, - "cpu_time": 5.1590798749998605e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 3.7042022270950174e+09, - "dst_gpu": 7.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7188239057396376e+05, - "cpu_time": 4.7002376824083709e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7587164376289537e+06, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToGPU/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2835489280699048e-03, - "cpu_time": 9.1107540546088905e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2840518769544713e-03, - "dst_gpu": 0.0000000000000000e+00, - "src_gpu": NaN - } - ] -} diff --git a/results/prefetch_managed_GPUToHost.json b/results/prefetch_managed_GPUToHost.json deleted file mode 100644 index 9c86902..0000000 --- a/results/prefetch_managed_GPUToHost.json +++ /dev/null @@ -1,27928 +0,0 @@ -{ - "context": { - "date": "2023-10-09T16:04:31-04:00", - "host_name": "frontier10439", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1813, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [1.43,9.37,13.09], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3520, - "real_time": 1.9891961827108223e+05, - "cpu_time": 2.7717179090909089e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1478079884736193e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3520, - "real_time": 1.9896811985828125e+05, - "cpu_time": 2.7690095056818164e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1465531298650410e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3520, - "real_time": 1.9856175645972227e+05, - "cpu_time": 2.7687723835227260e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1570857261615517e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3520, - "real_time": 1.9884042853846037e+05, - "cpu_time": 2.7673407727272704e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1498581426660642e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3520, - "real_time": 1.9903523016595998e+05, - "cpu_time": 2.7690991278409067e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1448178251969069e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9886503065870126e+05, - "cpu_time": 2.7691879397727258e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1492245624726368e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9891961827108223e+05, - "cpu_time": 2.7690095056818158e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1478079884736193e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8381755006050855e+02, - "cpu_time": 1.5831285584781969e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7634516345407956e+03, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.2433319951551625e-04, - "cpu_time": 5.7169415471603141e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2508135482314354e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3535, - "real_time": 1.9901998707371904e+05, - "cpu_time": 2.7667123451202275e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0290423741417488e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3535, - "real_time": 1.9899903017519732e+05, - "cpu_time": 2.7669991258840135e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0291507442005903e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3535, - "real_time": 1.9889146843207197e+05, - "cpu_time": 2.7719896492220653e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0297073153238144e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3535, - "real_time": 1.9842640100286738e+05, - "cpu_time": 2.7694707751060789e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0321207206547102e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3535, - "real_time": 1.9901656590404102e+05, - "cpu_time": 2.7693716633663338e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0290600637674933e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9887069051757935e+05, - "cpu_time": 2.7689087117397442e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0298162436176715e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9899903017519729e+05, - "cpu_time": 2.7693716633663338e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0291507442005903e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5390207383158139e+02, - "cpu_time": 2.1501720674278894e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3168191971743407e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2767194259283646e-03, - "cpu_time": 7.7654133497124438e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2786933643117223e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3537, - "real_time": 1.9899866315405205e+05, - "cpu_time": 2.7780435736499855e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0583052846084390e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3537, - "real_time": 1.9904652026024164e+05, - "cpu_time": 2.7743171840542834e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0578104026358865e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3537, - "real_time": 1.9887009404135850e+05, - "cpu_time": 2.7691685298275354e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0596359748028107e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3537, - "real_time": 1.9836235735376499e+05, - "cpu_time": 2.7713604664970242e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0649079062390242e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3537, - "real_time": 1.9892979613500697e+05, - "cpu_time": 2.7730458835171023e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0590178442751646e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9884148618888485e+05, - "cpu_time": 2.7731871275091858e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0599354825122654e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9892979613500697e+05, - "cpu_time": 2.7730458835171029e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0590178442751646e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7610010197729372e+02, - "cpu_time": 3.3304603495614521e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8648853466096596e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3885437454184929e-03, - "cpu_time": 1.2009504575166536e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3907645996347855e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3487, - "real_time": 1.9948982506050830e+05, - "cpu_time": 2.7913842701462639e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1064751034371011e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3487, - "real_time": 2.0005926075849522e+05, - "cpu_time": 2.7926767507886421e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0947866991716549e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3487, - "real_time": 1.9991802138833003e+05, - "cpu_time": 2.7933024806423899e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0976796104276560e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3487, - "real_time": 1.9949459374023872e+05, - "cpu_time": 2.7951626613134489e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1063769430598088e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3487, - "real_time": 2.0015231279054281e+05, - "cpu_time": 2.8005671924290230e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0928830078385539e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9982280274762303e+05, - "cpu_time": 2.7946186710639537e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0996402727869548e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9991802138833000e+05, - "cpu_time": 2.7933024806423899e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0976796104276560e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1310986150400680e+02, - "cpu_time": 3.5932434061512339e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4257225218744854e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5669375927003975e-03, - "cpu_time": 1.2857723464587145e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5673869155125285e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3467, - "real_time": 2.0075515439949569e+05, - "cpu_time": 2.8206247274300468e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1611852253598511e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3467, - "real_time": 2.0123110024764450e+05, - "cpu_time": 2.8179409114508214e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1418826313810721e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3467, - "real_time": 2.0108189455420611e+05, - "cpu_time": 2.8148551341217203e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1479240268364027e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3467, - "real_time": 2.0085557526512592e+05, - "cpu_time": 2.8164188289587543e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1571049140027106e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3467, - "real_time": 2.0115148433538401e+05, - "cpu_time": 2.8217255667724239e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1451051947907180e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0101504176037124e+05, - "cpu_time": 2.8183130337467539e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1506403984741509e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0108189455420614e+05, - "cpu_time": 2.8179409114508214e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1479240268364027e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0170408133457272e+02, - "cpu_time": 2.8580091818570247e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1807544616923929e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0034278010648716e-03, - "cpu_time": 1.0140850741684635e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0036946867664385e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3433, - "real_time": 2.0268892462018353e+05, - "cpu_time": 2.8650943227497838e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6166645543856716e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3433, - "real_time": 2.0308961008425540e+05, - "cpu_time": 2.8639802301194269e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6134749575030252e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3433, - "real_time": 2.0314138002110794e+05, - "cpu_time": 2.8674347888144356e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6130637685239291e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3433, - "real_time": 2.0268816977296190e+05, - "cpu_time": 2.8681093766385113e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6166705751354203e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3433, - "real_time": 2.0321617884915584e+05, - "cpu_time": 2.8685799912612973e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6124700398152438e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0296485266953293e+05, - "cpu_time": 2.8666397419166908e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6144687790726581e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0308961008425543e+05, - "cpu_time": 2.8674347888144356e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6134749575030252e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5621323182250137e+02, - "cpu_time": 2.0011132341119745e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0387514377677333e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2623527101003414e-03, - "cpu_time": 6.9806931260012152e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2628001632455108e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3373, - "real_time": 2.0640489349328505e+05, - "cpu_time": 2.9662954372961767e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1751185202463269e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3373, - "real_time": 2.0681578238983272e+05, - "cpu_time": 2.9614654965905676e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1688103897443086e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3373, - "real_time": 2.0655151904843503e+05, - "cpu_time": 2.9621728135191213e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1728645861293435e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3373, - "real_time": 2.0611448700845835e+05, - "cpu_time": 2.9629972220575262e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1795921262589651e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3373, - "real_time": 2.0676284197000982e+05, - "cpu_time": 2.9629609190631576e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1696217451637536e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0652990478200425e+05, - "cpu_time": 2.9631783777053107e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1732014735085392e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0655151904843506e+05, - "cpu_time": 2.9629609190631576e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1728645861293435e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8489149935664040e+02, - "cpu_time": 1.8534621092319617e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3796425520811626e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3794200876495256e-03, - "cpu_time": 6.2549798661371361e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3801968102701932e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3298, - "real_time": 2.1230788462896412e+05, - "cpu_time": 3.1243159611886012e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1736755669279790e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3298, - "real_time": 2.1225534579061478e+05, - "cpu_time": 3.1277960430563882e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1752037156840158e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3298, - "real_time": 2.1220333481879861e+05, - "cpu_time": 3.1183281655548816e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1767172562072587e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3298, - "real_time": 2.1201063224183381e+05, - "cpu_time": 3.1272406306852645e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1823314526268816e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3298, - "real_time": 2.1238148007541191e+05, - "cpu_time": 3.1262665949060000e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1715362353374350e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1223173551112466e+05, - "cpu_time": 3.1247894790782273e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1758928453567135e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1225534579061478e+05, - "cpu_time": 3.1262665949060000e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1752037156840158e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4006500543402279e+02, - "cpu_time": 3.8471493978329966e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0775786648451065e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.5996258804885922e-04, - "cpu_time": 1.2311707472107386e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6024116139106837e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3053, - "real_time": 2.2830810246614984e+05, - "cpu_time": 3.4382458336062985e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1482027889871619e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3053, - "real_time": 2.2857103742852190e+05, - "cpu_time": 3.4455092302653159e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1468819626020072e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3053, - "real_time": 2.2796053892227856e+05, - "cpu_time": 3.4425127874222177e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1499534140396817e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3053, - "real_time": 2.2842030913863101e+05, - "cpu_time": 3.4446199410415889e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1476387585173159e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3053, - "real_time": 2.2852910138747314e+05, - "cpu_time": 3.4417855322633579e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1470924202144938e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2835781786861093e+05, - "cpu_time": 3.4425346649197559e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1479538688721321e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2842030913863104e+05, - "cpu_time": 3.4425127874222177e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1476387585173159e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4444220473389510e+02, - "cpu_time": 2.8351440834307465e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2298895763116297e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0704350173574464e-03, - "cpu_time": 8.2356297303888808e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0713754356000383e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2731, - "real_time": 2.5600025340207454e+05, - "cpu_time": 4.1548620358842844e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0479979727854104e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2731, - "real_time": 2.5601396407699806e+05, - "cpu_time": 4.1552041376784974e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0478882934772906e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2731, - "real_time": 2.5615622679732266e+05, - "cpu_time": 4.1534437532039772e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0467509478691301e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2731, - "real_time": 2.5581021908323164e+05, - "cpu_time": 4.1537005346027086e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0495193736940396e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2731, - "real_time": 2.5617862034589736e+05, - "cpu_time": 4.1580573452947597e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0465720335760109e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5603185674110483e+05, - "cpu_time": 4.1550535613328463e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0477457242803764e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5601396407699809e+05, - "cpu_time": 4.1548620358842850e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0478882934772906e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4785942350134084e+02, - "cpu_time": 1.8374055663519712e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1828902639890143e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.7750400822524921e-04, - "cpu_time": 4.4220983899003543e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7765485722340276e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2231, - "real_time": 3.1390766957996006e+05, - "cpu_time": 5.6248260466158402e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3403962426375241e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2231, - "real_time": 3.1375634780745150e+05, - "cpu_time": 5.6192391842223029e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3420072847211313e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2231, - "real_time": 3.1330253201395320e+05, - "cpu_time": 5.6174750918870745e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3468481510813351e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2231, - "real_time": 3.1329464893295511e+05, - "cpu_time": 5.6101820663379703e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3469323640583296e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2231, - "real_time": 3.1346613509415183e+05, - "cpu_time": 5.6175198520842730e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3451013765332341e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1354546668569435e+05, - "cpu_time": 5.6178484482294938e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3442570838063111e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1346613509415183e+05, - "cpu_time": 5.6175198520842730e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3451013765332341e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7562750466428673e+02, - "cpu_time": 5.2354992000440950e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9390166174691832e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.7906710174375608e-04, - "cpu_time": 9.3194027006800130e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.7882496584984482e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1650, - "real_time": 4.2335142076340027e+05, - "cpu_time": 8.5218961090909108e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9536907097615290e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1650, - "real_time": 4.2378826694788801e+05, - "cpu_time": 8.5296862545454025e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9485843841398287e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1650, - "real_time": 4.2402724724855612e+05, - "cpu_time": 8.5379048848485190e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9457953789717016e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1650, - "real_time": 4.2328593462254060e+05, - "cpu_time": 8.5167406363636348e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9544570902647791e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1650, - "real_time": 4.2458070937727555e+05, - "cpu_time": 8.5456210121212492e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9393482880459957e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2380671579193213e+05, - "cpu_time": 8.5303697793939430e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9483751702367659e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2378826694788801e+05, - "cpu_time": 8.5296862545454013e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9485843841398287e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3069462565275012e+02, - "cpu_time": 1.1698309154039093e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1933110533477971e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2522090988130886e-03, - "cpu_time": 1.3713718697514917e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2515847809194032e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1046, - "real_time": 6.6615245410732669e+05, - "cpu_time": 1.4761157418738003e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2963124644201002e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1046, - "real_time": 6.6754145222318929e+05, - "cpu_time": 1.4781856806883353e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2832113062510681e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1046, - "real_time": 6.6683085582550277e+05, - "cpu_time": 1.4773695669216048e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2899068982158365e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1046, - "real_time": 6.6593298896653915e+05, - "cpu_time": 1.4762108986615634e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2983874796608839e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1046, - "real_time": 6.6725599968380318e+05, - "cpu_time": 1.4775264024856535e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2858992680284357e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6674275016127224e+05, - "cpu_time": 1.4770816581261915e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2907434833152657e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time_median", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6683085582550277e+05, - "cpu_time": 1.4773695669216048e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2899068982158365e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.9160597308517561e+02, - "cpu_time": 8.9313648024606607e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5257991529252566e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0372905785895525e-03, - "cpu_time": 6.0466290088463258e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0373653241836074e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 601, - "real_time": 1.1526615705229528e+06, - "cpu_time": 2.7318829850249547e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2775983988033533e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 601, - "real_time": 1.1653786464307625e+06, - "cpu_time": 2.7564528069883501e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.1981823467351341e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 601, - "real_time": 1.1592970594621191e+06, - "cpu_time": 2.7387349134775260e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2359434810367556e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 601, - "real_time": 1.1564492912011566e+06, - "cpu_time": 2.7390869584026420e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2537620662010145e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 601, - "real_time": 1.1607273086632746e+06, - "cpu_time": 2.7403385757071390e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2270273451742516e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1589027752560531e+06, - "cpu_time": 2.7412992479201225e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2385027275901022e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time_median", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1592970594621191e+06, - "cpu_time": 2.7390869584026420e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2359434810367556e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7537750837863377e+03, - "cpu_time": 9.0924321071382055e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9687060225233484e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1019619464937587e-03, - "cpu_time": 3.3168331089853879e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1012708487459708e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 316, - "real_time": 2.2050644885571790e+06, - "cpu_time": 5.3987580221518911e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6084922173762321e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 316, - "real_time": 2.2086522805716703e+06, - "cpu_time": 5.4010532499999879e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.5961327854004784e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 316, - "real_time": 2.2053313485782924e+06, - "cpu_time": 5.3995564873418016e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6075715383158827e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 316, - "real_time": 2.2069815586061701e+06, - "cpu_time": 5.4003301265823031e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6018831850120821e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 316, - "real_time": 2.2075153176991055e+06, - "cpu_time": 5.3994505632911287e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6000451120252705e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2067089988024840e+06, - "cpu_time": 5.3998296898734234e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6028249676259890e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time_median", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2069815586061701e+06, - "cpu_time": 5.3995564873418007e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6018831850120821e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5085686200941138e+03, - "cpu_time": 8.8238094983434439e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1972951537506506e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.8362825407100331e-04, - "cpu_time": 1.6340903334212899e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8360052689382450e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 160, - "real_time": 4.4008672790369019e+06, - "cpu_time": 1.1199404868750039e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6245044152622452e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 160, - "real_time": 4.4398016179911792e+06, - "cpu_time": 1.1285354068749953e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.5576421847384138e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 160, - "real_time": 4.3665882578352466e+06, - "cpu_time": 1.1178530843750067e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6843590507511559e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 160, - "real_time": 4.3806326109915972e+06, - "cpu_time": 1.1215644887499999e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6597229166872864e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 160, - "real_time": 4.2212305910652503e+06, - "cpu_time": 1.0929014993750030e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.9489692107846584e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3618240713840351e+06, - "cpu_time": 1.1161589932500018e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6950395556447525e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time_median", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3806326109915972e+06, - "cpu_time": 1.1199404868750039e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6597229166872864e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3288437345108701e+04, - "cpu_time": 1.3605841171524982e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4974549366529331e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9094863979390333e-02, - "cpu_time": 1.2189877296878522e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9460003107514424e-02, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 77, - "real_time": 8.9442041134098899e+06, - "cpu_time": 2.2915713870130036e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.5030559621716194e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 77, - "real_time": 8.9026747706842106e+06, - "cpu_time": 2.2844621441558354e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.5380563402118282e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 77, - "real_time": 8.9034936088439710e+06, - "cpu_time": 2.2868627779220786e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.5373630788412971e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 77, - "real_time": 8.9314026371031608e+06, - "cpu_time": 2.2899564636363663e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.5138101736914072e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 77, - "real_time": 8.9142826543032341e+06, - "cpu_time": 2.2884046051948071e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.5282405329164886e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9192115568688940e+06, - "cpu_time": 2.2882514755844180e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.5241052175665283e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time_median", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9142826543032341e+06, - "cpu_time": 2.2884046051948067e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.5282405329164886e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8152572734788740e+04, - "cpu_time": 2.7495344469706753e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5301671663135372e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0352216806438480e-03, - "cpu_time": 1.2015875336728215e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0336865608166351e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 41, - "real_time": 1.7021081342202861e+07, - "cpu_time": 4.3598392951219492e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8853819743645973e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 41, - "real_time": 1.7027213215464499e+07, - "cpu_time": 4.3612554634146281e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8825422752150908e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 41, - "real_time": 1.6987502393199176e+07, - "cpu_time": 4.3560442463414662e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.9009688942697716e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 41, - "real_time": 1.6987088704254568e+07, - "cpu_time": 4.3533431341463447e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.9011613076691570e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 41, - "real_time": 1.7001598800827816e+07, - "cpu_time": 4.3551266243902199e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8944180234075909e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7004896891189788e+07, - "cpu_time": 4.3571217526829220e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8928944949852419e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time_median", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7001598800827816e+07, - "cpu_time": 4.3560442463414662e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8944180234075909e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8644920662028158e+04, - "cpu_time": 3.3125562705636796e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.6525093886109125e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0964442055328232e-03, - "cpu_time": 7.6026249863776589e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0962403455548903e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 21, - "real_time": 3.2967441316161837e+07, - "cpu_time": 8.4092913857142821e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1424413082492752e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 21, - "real_time": 3.2946891905296415e+07, - "cpu_time": 8.4122844761904642e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1475198562462072e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 21, - "real_time": 3.2975494152023681e+07, - "cpu_time": 8.4162426666665629e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1404528697116232e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 21, - "real_time": 3.2936096368801028e+07, - "cpu_time": 8.4127463428570434e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1501903866870384e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 21, - "real_time": 3.2952431589365005e+07, - "cpu_time": 8.4070106428571627e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1461501641242847e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2955671066329587e+07, - "cpu_time": 8.4115151028571039e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1453509170036869e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time_median", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2952431589365005e+07, - "cpu_time": 8.4122844761904627e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1461501641242847e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5829009520527849e+04, - "cpu_time": 3.5246568843488232e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9121685336293988e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.8031215898073932e-04, - "cpu_time": 4.1902758792546405e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8029465808067506e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 6.5106176584959030e+07, - "cpu_time": 1.6470044380000106e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2460826324123154e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 6.5126322954893112e+07, - "cpu_time": 1.6489566779999906e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2435317647495632e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 6.5104769915342331e+07, - "cpu_time": 1.6490727380000010e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2462607992948780e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 6.5052977204322815e+07, - "cpu_time": 1.6456312109999943e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2528261591127386e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 6.5246356278657913e+07, - "cpu_time": 1.6490447239999923e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2283661896321173e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.5127320587635040e+07, - "cpu_time": 1.6479419577999979e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2434135090403233e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time_median", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.5106176584959030e+07, - "cpu_time": 1.6489566779999906e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2460826324123154e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1855812785111659e+04, - "cpu_time": 1.5606816124928460e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0865982147071958e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1033128975177597e-03, - "cpu_time": 9.4704889641644642e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1022858679529026e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4186985790729523e+08, - "cpu_time": 3.1891089540000051e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.5684986214734631e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4165958166122437e+08, - "cpu_time": 3.1857974640000182e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.5797331278856163e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4159206449985504e+08, - "cpu_time": 3.1863374380000097e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.5833474693145618e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4180269241333008e+08, - "cpu_time": 3.1903095679999751e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.5720834754690704e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4198231101036072e+08, - "cpu_time": 3.1920988019999754e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.5625042046374846e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4178130149841312e+08, - "cpu_time": 3.1887304451999968e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.5732333797560396e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time_median", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4180269241333008e+08, - "cpu_time": 3.1891089540000051e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.5720834754690704e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5758409903543704e+05, - "cpu_time": 2.6604317050995980e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4171988797794245e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1114589679316834e-03, - "cpu_time": 8.3432317369577346e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1114405773205648e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3556, - "real_time": 1.9805493237060093e+05, - "cpu_time": 2.7401645838020410e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1702827480402682e+06, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3556, - "real_time": 1.9779080568892800e+05, - "cpu_time": 2.7427686079865252e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1771870610127244e+06, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3556, - "real_time": 1.9711508050761177e+05, - "cpu_time": 2.7342396344206674e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1949348439652110e+06, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3556, - "real_time": 1.9723139651548179e+05, - "cpu_time": 2.7318800871766527e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1918711629647687e+06, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3556, - "real_time": 1.9774131886067847e+05, - "cpu_time": 2.7352781046118966e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1784827060927730e+06, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9758670678866020e+05, - "cpu_time": 2.7368662035995570e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1825517044151491e+06, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time_median", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9774131886067847e+05, - "cpu_time": 2.7352781046118971e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1784827060927730e+06, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9795514467110581e+02, - "cpu_time": 4.4721351313194617e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0440999586871310e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0140785336169439e-03, - "cpu_time": 1.6340349869634330e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0146445578104613e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3546, - "real_time": 1.9719363241038195e+05, - "cpu_time": 2.7339197349125828e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0385730892861102e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3546, - "real_time": 1.9773232298492134e+05, - "cpu_time": 2.7347927552170987e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0357436604617123e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3546, - "real_time": 1.9706293855317347e+05, - "cpu_time": 2.7349138945290440e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0392618800045898e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3546, - "real_time": 1.9770440070760407e+05, - "cpu_time": 2.7393857952622918e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0358899410787016e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3546, - "real_time": 1.9738844892912131e+05, - "cpu_time": 2.7384328285392234e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0375480485868758e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9741634871704044e+05, - "cpu_time": 2.7362890016920480e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0374033238835981e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time_median", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9738844892912131e+05, - "cpu_time": 2.7349138945290435e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0375480485868758e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9920452141288598e+02, - "cpu_time": 2.4458752142387502e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5722863430467271e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5156015363334469e-03, - "cpu_time": 8.9386582072518148e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5155979423323552e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3544, - "real_time": 1.9760457264310308e+05, - "cpu_time": 2.7413309565462917e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0728265268425010e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3544, - "real_time": 1.9718634217788841e+05, - "cpu_time": 2.7376681743792316e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0772229733359832e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3544, - "real_time": 1.9763446194439041e+05, - "cpu_time": 2.7358362556433387e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0725130423622761e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3544, - "real_time": 1.9711903327124447e+05, - "cpu_time": 2.7330505784424726e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0779322686529838e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3544, - "real_time": 1.9717347623589716e+05, - "cpu_time": 2.7350977934537013e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0773585160610396e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9734357725450472e+05, - "cpu_time": 2.7365967516930075e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0755706654509567e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time_median", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9718634217788844e+05, - "cpu_time": 2.7358362556433387e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0772229733359832e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5338198530841115e+02, - "cpu_time": 3.1209460477710377e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6637875520874877e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2839636781370204e-03, - "cpu_time": 1.1404479106540820e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2834000771102293e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3525, - "real_time": 1.9829346754601397e+05, - "cpu_time": 2.7600784113475023e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1312505658306912e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3525, - "real_time": 1.9838245526527497e+05, - "cpu_time": 2.7609588056737697e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1293974253145233e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3525, - "real_time": 1.9878946879221429e+05, - "cpu_time": 2.7612552226950106e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1209426484069586e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3525, - "real_time": 1.9860491580957323e+05, - "cpu_time": 2.7526912340425281e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1247720211793095e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3525, - "real_time": 1.9826530229964078e+05, - "cpu_time": 2.7540581645390304e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1318374445667408e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9846712194254348e+05, - "cpu_time": 2.7578083676595689e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1276400210596450e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time_median", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9838245526527500e+05, - "cpu_time": 2.7600784113475028e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1293974253145233e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2413729341305390e+02, - "cpu_time": 4.0990318235780234e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6589454577323610e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1293421863493439e-03, - "cpu_time": 1.4863367127487151e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1287189372042961e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3504, - "real_time": 1.9994400853020581e+05, - "cpu_time": 2.7902466238584160e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1942940528397217e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3504, - "real_time": 1.9961063898663933e+05, - "cpu_time": 2.7856307448630605e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2079793357590720e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3504, - "real_time": 1.9932876442675744e+05, - "cpu_time": 2.7810503881278663e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2195863939247131e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3504, - "real_time": 2.0011069485519003e+05, - "cpu_time": 2.7856940781962808e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1874684468295261e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3504, - "real_time": 1.9967867134570979e+05, - "cpu_time": 2.7838364126712718e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2051828017394394e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9973455562890050e+05, - "cpu_time": 2.7852916495433793e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2029022062184960e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time_median", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9967867134570979e+05, - "cpu_time": 2.7856307448630605e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2051828017394394e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0351940731219349e+02, - "cpu_time": 3.3516681540987679e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2466371896526270e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5196139013427474e-03, - "cpu_time": 1.2033454933339709e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5197513737364443e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3472, - "real_time": 2.0198949265409389e+05, - "cpu_time": 2.8274130443548097e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6222626023480862e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3472, - "real_time": 2.0134021443704332e+05, - "cpu_time": 2.8270197292626504e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6274940449239543e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3472, - "real_time": 2.0129576394806401e+05, - "cpu_time": 2.8217181048387563e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6278534310565233e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3472, - "real_time": 2.0183124912607382e+05, - "cpu_time": 2.8230144326036843e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6235345191532496e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3472, - "real_time": 2.0134598775433504e+05, - "cpu_time": 2.8234609591013455e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6274473787866426e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0156054158392205e+05, - "cpu_time": 2.8245252540322498e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6257183952536914e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time_median", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0134598775433504e+05, - "cpu_time": 2.8234609591013455e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6274473787866426e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2479462273869609e+02, - "cpu_time": 2.5424953936777359e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6178480243321994e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6113998314668356e-03, - "cpu_time": 9.0014964109388224e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6102715156419741e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3412, - "real_time": 2.0526517730460508e+05, - "cpu_time": 2.9116833851113205e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1927480764429551e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3412, - "real_time": 2.0480012892929543e+05, - "cpu_time": 2.9149369519343699e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1999979854810268e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3412, - "real_time": 2.0477710966317524e+05, - "cpu_time": 2.9153461283704196e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.2003577014929044e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3412, - "real_time": 2.0540116944764237e+05, - "cpu_time": 2.9144247127783828e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1906342196705651e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3412, - "real_time": 2.0494372398316301e+05, - "cpu_time": 2.9153333352871984e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1977558876301116e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0503746186557622e+05, - "cpu_time": 2.9143449026963382e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1962987741435128e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time_median", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0494372398316301e+05, - "cpu_time": 2.9149369519343699e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1977558876301116e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8152908773026439e+02, - "cpu_time": 1.5346025253369598e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3868230816845124e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3730617086688114e-03, - "cpu_time": 5.2656860343370919e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3724696568330084e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3333, - "real_time": 2.1016275682876390e+05, - "cpu_time": 3.0751263756375253e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2366901718364227e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3333, - "real_time": 2.1015387818703757e+05, - "cpu_time": 3.0790018601859995e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2369536613236105e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3333, - "real_time": 2.0995542223209294e+05, - "cpu_time": 3.0735035913591977e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2428490108299220e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3333, - "real_time": 2.1015681027352478e+05, - "cpu_time": 3.0809669696970028e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2368666439791441e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3333, - "real_time": 2.1024004883532313e+05, - "cpu_time": 3.0798805160515482e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2343973341951656e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1013378327134848e+05, - "cpu_time": 3.0776958625862550e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2375513644328535e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time_median", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1015681027352475e+05, - "cpu_time": 3.0790018601860001e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2368666439791441e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0592278546111535e+02, - "cpu_time": 3.2154270107886521e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1456600223164615e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.0407309006727347e-04, - "cpu_time": 1.0447513836167877e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0431007915274762e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3091, - "real_time": 2.2676808594268651e+05, - "cpu_time": 3.4238437851827691e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1560004085683134e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3091, - "real_time": 2.2676875725629117e+05, - "cpu_time": 3.4166471562601294e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1559969864090590e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3091, - "real_time": 2.2655270053611585e+05, - "cpu_time": 3.4181200355872296e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1570994271075146e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3091, - "real_time": 2.2626898706589645e+05, - "cpu_time": 3.4177396408928826e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1585502874225342e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3091, - "real_time": 2.2674438127765324e+05, - "cpu_time": 3.4211560757036007e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1561212609674292e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2662058241572866e+05, - "cpu_time": 3.4195013387253217e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1567536740949700e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time_median", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2674438127765324e+05, - "cpu_time": 3.4181200355872291e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1561212609674292e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1637148126913240e+02, - "cpu_time": 2.9475808244842079e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1053614982981812e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.5477418230355358e-04, - "cpu_time": 8.6199142287307000e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.5557206607794229e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2737, - "real_time": 2.5548368425838032e+05, - "cpu_time": 4.1457165107782581e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0521388734545085e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2737, - "real_time": 2.5535820352402201e+05, - "cpu_time": 4.1476520314213180e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0531472761190507e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2737, - "real_time": 2.5523710198571807e+05, - "cpu_time": 4.1452250383631949e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0541214263956690e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2737, - "real_time": 2.5535524076046157e+05, - "cpu_time": 4.1436857983192790e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0531710977955346e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2737, - "real_time": 2.5551638240658175e+05, - "cpu_time": 4.1502440518815507e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0518762635177910e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5539012258703276e+05, - "cpu_time": 4.1465046861527202e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0528909874565110e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time_median", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5535820352402198e+05, - "cpu_time": 4.1457165107782581e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0531472761190507e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1218979579277723e+02, - "cpu_time": 2.5250794407032603e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0186831180610845e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.3928792020742617e-04, - "cpu_time": 6.0896577523131224e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3931622152207139e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2247, - "real_time": 3.1162083526800957e+05, - "cpu_time": 5.6205477659100899e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3649097920495977e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2247, - "real_time": 3.1159919732777483e+05, - "cpu_time": 5.6189200356031233e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3651434566982875e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2247, - "real_time": 3.1140166404802131e+05, - "cpu_time": 5.6157368046284548e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3672780882709055e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2247, - "real_time": 3.1137254638450232e+05, - "cpu_time": 5.6158247797062795e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3675929756027775e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2247, - "real_time": 3.1174324574576906e+05, - "cpu_time": 5.6215270093457890e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3635885117303495e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1154749775481544e+05, - "cpu_time": 5.6185112790387473e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3657025648703837e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time_median", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1159919732777483e+05, - "cpu_time": 5.6189200356031233e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3651434566982875e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5671946635086425e+02, - "cpu_time": 2.6610137592203228e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6930917056792877e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.0303554828805199e-04, - "cpu_time": 4.7361545204116544e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0304258116893057e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1664, - "real_time": 4.2092511610182835e+05, - "cpu_time": 8.4881228425480996e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9822448691625862e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1664, - "real_time": 4.2090424961735646e+05, - "cpu_time": 8.4901561057693081e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9824918658020639e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1664, - "real_time": 4.2098733486175031e+05, - "cpu_time": 8.4897106490384904e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9815085308651676e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1664, - "real_time": 4.2070185147097684e+05, - "cpu_time": 8.4887042968750081e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9848889247036676e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1664, - "real_time": 4.2109935676447861e+05, - "cpu_time": 8.4859467668269447e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9801833375227394e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2092358176327823e+05, - "cpu_time": 8.4885281322115695e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9822635056112452e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time_median", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2092511610182829e+05, - "cpu_time": 8.4887042968750093e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9822448691625862e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4534589512820546e+02, - "cpu_time": 1.6513165143143380e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7206399419750781e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.4530233378548517e-04, - "cpu_time": 1.9453508177089704e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4535305891332670e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1049, - "real_time": 6.6211415163762472e+05, - "cpu_time": 1.4684898083889463e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3347143232418680e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1049, - "real_time": 6.6179781763754901e+05, - "cpu_time": 1.4672240390848629e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3377422654136353e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1049, - "real_time": 6.6322242949660460e+05, - "cpu_time": 1.4702880924690126e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3241286986984701e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1049, - "real_time": 6.6301346848851105e+05, - "cpu_time": 1.4698512459485293e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3261218653097095e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1049, - "real_time": 6.6202617267251469e+05, - "cpu_time": 1.4681465252621232e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3355561655034466e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6243480798656086e+05, - "cpu_time": 1.4687999422306949e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3316526636334267e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time_median", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6211415163762472e+05, - "cpu_time": 1.4684898083889466e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3347143232418680e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3850521505588290e+02, - "cpu_time": 1.2576205803756307e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1011088060319005e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.6387630504590966e-04, - "cpu_time": 8.5622319569652065e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6358867584040396e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 605, - "real_time": 1.1477059224805185e+06, - "cpu_time": 2.7230125107438243e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3090221420743685e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 605, - "real_time": 1.1471746364331320e+06, - "cpu_time": 2.7215280727272676e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3124071380120392e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 605, - "real_time": 1.1473119089549237e+06, - "cpu_time": 2.7207576363636227e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3115322298372278e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 605, - "real_time": 1.1471489767644031e+06, - "cpu_time": 2.7209807636363958e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3125707034674177e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 605, - "real_time": 1.1474002443238602e+06, - "cpu_time": 2.7213736264462746e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3109693339338961e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1473483377913677e+06, - "cpu_time": 2.7215305219834773e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3113003094649906e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time_median", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1473119089549237e+06, - "cpu_time": 2.7213736264462750e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3115322298372278e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2461363358792431e+02, - "cpu_time": 8.8324675476048219e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4311139730433770e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9576760273196803e-04, - "cpu_time": 3.2454045531584319e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9574000690283501e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 317, - "real_time": 2.2007421155574759e+06, - "cpu_time": 5.3842513217665609e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6234356953495750e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 317, - "real_time": 2.2026217992091402e+06, - "cpu_time": 5.3898247917980328e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6169299722829952e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 317, - "real_time": 2.2005317064313577e+06, - "cpu_time": 5.3857516403785646e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6241646284696875e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 317, - "real_time": 2.2018122118060426e+06, - "cpu_time": 5.3844650725553511e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6197306518880835e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 317, - "real_time": 2.1998285990184885e+06, - "cpu_time": 5.3842447476340178e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6266014577161140e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2011072864045007e+06, - "cpu_time": 5.3857075148265045e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6221724811412907e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time_median", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2007421155574759e+06, - "cpu_time": 5.3844650725553501e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6234356953495750e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1057070518157193e+03, - "cpu_time": 2.3852549980754511e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8284012282100213e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.0234128006631010e-04, - "cpu_time": 4.4288610020299068e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.0227166043306109e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 143, - "real_time": 4.8724233654777072e+06, - "cpu_time": 1.1986320699300727e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 6.8866002568129101e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 143, - "real_time": 4.7721216468127454e+06, - "cpu_time": 1.1832323615384463e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.0313446478068476e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 143, - "real_time": 4.3542008925151154e+06, - "cpu_time": 1.1213815867132926e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.7062204588860769e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 143, - "real_time": 4.3713254300499717e+06, - "cpu_time": 1.1229729762237877e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6760315691290045e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 143, - "real_time": 4.7260883453113213e+06, - "cpu_time": 1.1758973972027697e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.0998317315182705e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6192319360333728e+06, - "cpu_time": 1.1604232783216739e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.2800057328306236e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time_median", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.7260883453113222e+06, - "cpu_time": 1.1758973972027700e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.0998317315182705e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4010338687080162e+05, - "cpu_time": 3.5869183149944758e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8326176767226988e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.1979071455109320e-02, - "cpu_time": 3.0910430547224577e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2645805750382205e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 72, - "real_time": 9.5887914196484610e+06, - "cpu_time": 2.3987292472222224e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 6.9986780463788939e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 72, - "real_time": 9.5677758282464407e+06, - "cpu_time": 2.3968491791666541e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0140506220764532e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 72, - "real_time": 9.4821974764474556e+06, - "cpu_time": 2.3806990305555724e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0773535529806967e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 72, - "real_time": 9.5065621296978667e+06, - "cpu_time": 2.3838922986110825e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0592147912604904e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 72, - "real_time": 9.5644581467948034e+06, - "cpu_time": 2.3921599833333258e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0164836282428837e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5419570001670066e+06, - "cpu_time": 2.3904659477777716e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0331561281878834e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time_median", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5644581467948034e+06, - "cpu_time": 2.3921599833333261e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0164836282428837e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5250342158399661e+04, - "cpu_time": 7.9136441120105956e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3407323384565845e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.7422496409916404e-03, - "cpu_time": 3.3105027575763162e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7499760812466643e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 40, - "real_time": 1.7292021773755550e+07, - "cpu_time": 4.4120073975000195e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7618296897882090e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 40, - "real_time": 1.7382854688912630e+07, - "cpu_time": 4.4146457700000495e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7212707810074825e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 40, - "real_time": 1.7301690112799406e+07, - "cpu_time": 4.4109988299999259e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7574923099974327e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 40, - "real_time": 1.7368670692667365e+07, - "cpu_time": 4.4149911925001107e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7275762995877113e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 40, - "real_time": 1.7365410737693310e+07, - "cpu_time": 4.4174028899999484e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7290269736417685e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7342129601165656e+07, - "cpu_time": 4.4140092160000108e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7394392108045216e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time_median", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7365410737693310e+07, - "cpu_time": 4.4146457700000495e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7290269736417685e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1985474319432491e+04, - "cpu_time": 2.5473615383582546e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8751554109647553e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4210102960256063e-03, - "cpu_time": 5.7710834157856188e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4228569537014704e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 21, - "real_time": 3.3223464552845273e+07, - "cpu_time": 8.4711727809525162e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0796948666514387e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 21, - "real_time": 3.3321659125032879e+07, - "cpu_time": 8.4931135952382684e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0558850624078922e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 21, - "real_time": 3.3255099185875483e+07, - "cpu_time": 8.4849057285715550e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0720088819946508e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 21, - "real_time": 3.3312836573237464e+07, - "cpu_time": 8.4836245619047046e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0580185782093687e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 21, - "real_time": 3.3293270461616062e+07, - "cpu_time": 8.4845804523808971e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0627541926071892e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3281265979721434e+07, - "cpu_time": 8.4834794238095880e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0656723163741093e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time_median", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3293270461616058e+07, - "cpu_time": 8.4845804523808971e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0627541926071892e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1225362939808190e+04, - "cpu_time": 7.8666764233693830e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9958675770020075e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2386957564933727e-03, - "cpu_time": 9.2729362922610551e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2393099031198444e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.9692921704716146e+07, - "cpu_time": 1.6257642555555347e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.7367452531010475e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.9666893515321940e+07, - "cpu_time": 1.6246328655555290e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.7389462336289825e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.9677310254838735e+07, - "cpu_time": 1.6256611599999991e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.7380652068058023e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.9615516795052424e+07, - "cpu_time": 1.6252997511111289e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.7432949456576662e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.9624600708484650e+07, - "cpu_time": 1.6259006544444472e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.7425256418622398e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9655448595682785e+07, - "cpu_time": 1.6254517373333281e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.7399154562111473e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time_median", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9666893515321940e+07, - "cpu_time": 1.6256611599999994e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.7389462336289825e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3761268760949075e+04, - "cpu_time": 5.0909303262584333e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8568785920301201e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2384129844419573e-04, - "cpu_time": 3.1320095265396648e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2387454421217893e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.3113647699356079e+08, - "cpu_time": 3.1226671240000314e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.1879721692746410e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.3146262466907501e+08, - "cpu_time": 3.1237013420000041e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.1676585014401035e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.3139264583587646e+08, - "cpu_time": 3.1223789239999181e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.1720085410352335e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.3159430623054504e+08, - "cpu_time": 3.1246687760000217e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.1594854272712307e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.3130146861076355e+08, - "cpu_time": 3.1240766480000275e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.1776832762095938e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3137750446796420e+08, - "cpu_time": 3.1234985628000009e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.1729615830461617e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time_median", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3139264583587646e+08, - "cpu_time": 3.1237013420000041e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.1720085410352335e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7201265134027338e+05, - "cpu_time": 9.6041427977631232e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0703385249432070e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3093006450142907e-03, - "cpu_time": 3.0748030148455304e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3096091472685951e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3472, - "real_time": 2.0079822957400774e+05, - "cpu_time": 2.8061618058755802e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.0996465565080419e+06, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3472, - "real_time": 2.0111911003850724e+05, - "cpu_time": 2.8028766129031964e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.0915101991249863e+06, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3472, - "real_time": 2.0019578090385391e+05, - "cpu_time": 2.7999714775345521e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1149929103240520e+06, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3472, - "real_time": 2.0033928737789232e+05, - "cpu_time": 2.8015705155531073e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1113289530099407e+06, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3472, - "real_time": 2.0081887499476629e+05, - "cpu_time": 2.7968775460828299e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.0991222813427635e+06, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0065425657780556e+05, - "cpu_time": 2.8014915915898531e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1033201800619569e+06, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time_median", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0079822957400774e+05, - "cpu_time": 2.8015705155531073e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.0996465565080419e+06, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7859005772039586e+02, - "cpu_time": 3.4400427754502482e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6305060783023619e+03, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8867781036760317e-03, - "cpu_time": 1.2279325719832038e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8871059895335517e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3492, - "real_time": 2.0048209889895920e+05, - "cpu_time": 2.8021352262314170e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0215375892648499e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3492, - "real_time": 2.0077804343675301e+05, - "cpu_time": 2.7980425544100167e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0200318545514362e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3492, - "real_time": 2.0020590112677281e+05, - "cpu_time": 2.7955873396334215e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0229468704337450e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3492, - "real_time": 2.0010289936201760e+05, - "cpu_time": 2.7985579209621903e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0234734261870168e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3492, - "real_time": 2.0071637542457730e+05, - "cpu_time": 2.8001400887744559e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0203452486962490e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0045706364981594e+05, - "cpu_time": 2.7988926260022999e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0216669978266595e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time_median", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0048209889895917e+05, - "cpu_time": 2.7985579209621897e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0215375892648499e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9975504147923357e+02, - "cpu_time": 2.4408086144720738e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5279658193549971e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4953578388381664e-03, - "cpu_time": 8.7206225483480468e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4955614917633254e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3493, - "real_time": 2.0020707841227224e+05, - "cpu_time": 2.7992330088748166e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0458817103186522e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3493, - "real_time": 2.0082532631256929e+05, - "cpu_time": 2.7975521042083605e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0395833908044487e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3493, - "real_time": 2.0004602952104679e+05, - "cpu_time": 2.7989455339250230e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0475287661578212e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3493, - "real_time": 2.0008867507719275e+05, - "cpu_time": 2.7973641454337595e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0470923696305119e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3493, - "real_time": 2.0075189776076315e+05, - "cpu_time": 2.8056168365302822e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0403294044478819e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0038380141676887e+05, - "cpu_time": 2.7997423257944488e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0440831282718632e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time_median", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0020707841227224e+05, - "cpu_time": 2.7989455339250236e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0458817103186522e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7511984158644145e+02, - "cpu_time": 3.3858887243799728e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8242950721954956e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8720068135959118e-03, - "cpu_time": 1.2093572659116765e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8709097586597095e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3476, - "real_time": 2.0115745997415256e+05, - "cpu_time": 2.8163863377445471e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0724316170290776e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3476, - "real_time": 2.0180874141037650e+05, - "cpu_time": 2.8209657192174724e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0592889796292976e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3476, - "real_time": 2.0147552830217351e+05, - "cpu_time": 2.8188567520137707e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0660024912373565e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3476, - "real_time": 2.0079713262475186e+05, - "cpu_time": 2.8114871029919258e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0797395325904116e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3476, - "real_time": 2.0114300263800038e+05, - "cpu_time": 2.8151685960875003e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0727243267533630e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0127637298989098e+05, - "cpu_time": 2.8165729016110429e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0700373894479021e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time_median", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0115745997415259e+05, - "cpu_time": 2.8163863377445476e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0724316170290776e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8232128412728906e+02, - "cpu_time": 3.6188757528248573e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7280698837500822e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8994841691950151e-03, - "cpu_time": 1.2848507314527193e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8987712259808968e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3454, - "real_time": 2.0236487683519768e+05, - "cpu_time": 2.8497764418066217e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0962666329408705e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3454, - "real_time": 2.0293178270617043e+05, - "cpu_time": 2.8476760191082384e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0736490763118997e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3454, - "real_time": 2.0232874849529023e+05, - "cpu_time": 2.8474567544874904e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0977123230618834e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3454, - "real_time": 2.0300266126821385e+05, - "cpu_time": 2.8531616589461407e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0708301544642881e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3454, - "real_time": 2.0252784599204123e+05, - "cpu_time": 2.8498460683265683e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0897517670947045e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0263118305938269e+05, - "cpu_time": 2.8495833885350113e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0856419907747298e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time_median", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0252784599204126e+05, - "cpu_time": 2.8497764418066217e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0897517670947045e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1678874165114883e+02, - "cpu_time": 2.2951535830728835e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2636125753172924e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5633760651652087e-03, - "cpu_time": 8.0543478471526179e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5627857092349678e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3423, - "real_time": 2.0430050351584330e+05, - "cpu_time": 2.8939940286298346e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6039118570972526e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3423, - "real_time": 2.0493826724368081e+05, - "cpu_time": 2.8941019281332998e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.5989205159540740e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3423, - "real_time": 2.0432719267639346e+05, - "cpu_time": 2.8918908705814090e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6037023545807168e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3423, - "real_time": 2.0424314807511278e+05, - "cpu_time": 2.8926331317557476e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6043622666817293e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3423, - "real_time": 2.0625136914312580e+05, - "cpu_time": 2.9078455623722868e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.5887409686604804e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0481209613083125e+05, - "cpu_time": 2.8960931042945158e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.5999275925948507e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time_median", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0432719267639349e+05, - "cpu_time": 2.8939940286298346e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6037023545807168e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5264092787470634e+02, - "cpu_time": 6.6355359650168998e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6321995661318873e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1630398984347618e-03, - "cpu_time": 2.2912025705172580e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1453123234004739e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3361, - "real_time": 2.0803874763096240e+05, - "cpu_time": 2.9927518119607470e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1501823937266517e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3361, - "real_time": 2.0864267254017439e+05, - "cpu_time": 2.9934074144599162e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1410640595289040e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3361, - "real_time": 2.0814214632306769e+05, - "cpu_time": 2.9931578786075523e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1486174788588154e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3361, - "real_time": 2.0807649719977612e+05, - "cpu_time": 2.9943320202321495e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1496108826302612e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3361, - "real_time": 2.0864314940223671e+05, - "cpu_time": 2.9930675513240264e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1410568805043852e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0830864261924347e+05, - "cpu_time": 2.9933433353168785e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1461063390498036e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time_median", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0814214632306769e+05, - "cpu_time": 2.9931578786075523e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1486174788588154e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0737867243258114e+02, - "cpu_time": 6.0040712681579656e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6401369848313747e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4755925081535030e-03, - "cpu_time": 2.0058077525952659e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4748824371374563e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3242, - "real_time": 2.1571409771862952e+05, - "cpu_time": 3.1476321190621681e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0761907258822775e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3242, - "real_time": 2.1581700282152122e+05, - "cpu_time": 3.1484490623071801e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0732934980287635e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3242, - "real_time": 2.1622391740314203e+05, - "cpu_time": 3.1498910795806197e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0618640885883486e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3242, - "real_time": 2.1571356235447619e+05, - "cpu_time": 3.1454132233188045e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0762058059480274e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3242, - "real_time": 2.1581863330931097e+05, - "cpu_time": 3.1476937816162850e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0732476149150562e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1585744272141601e+05, - "cpu_time": 3.1478158531770116e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0721603466724956e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time_median", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1581700282152122e+05, - "cpu_time": 3.1476937816162850e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0732934980287635e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1136141921832262e+02, - "cpu_time": 1.6224062643618902e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9390405797569698e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.7917132971460309e-04, - "cpu_time": 5.1540698059717696e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7807703365599113e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3051, - "real_time": 2.3032695895632633e+05, - "cpu_time": 3.4884667125533696e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1381385886734462e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3051, - "real_time": 2.2933989036494031e+05, - "cpu_time": 3.4713144739430712e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1430370860597332e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3051, - "real_time": 2.2960677086380997e+05, - "cpu_time": 3.4706018387414434e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1417084914951804e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3051, - "real_time": 2.2966120633061169e+05, - "cpu_time": 3.4733710783350200e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1414378779436841e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3051, - "real_time": 2.2914061399579039e+05, - "cpu_time": 3.4698558275974065e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1440311493833036e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2961508810229576e+05, - "cpu_time": 3.4747219862340624e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1416706387110693e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time_median", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2960677086380994e+05, - "cpu_time": 3.4713144739430712e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1417084914951804e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4994878948247907e+02, - "cpu_time": 7.7943683031494470e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2344001918367264e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9595784980907809e-03, - "cpu_time": 2.2431631462973699e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9571320449821971e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2705, - "real_time": 2.5832322560631207e+05, - "cpu_time": 4.2000765841036983e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0295813462743828e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2705, - "real_time": 2.5936231665251267e+05, - "cpu_time": 4.2187723770794470e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0214501735131717e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2705, - "real_time": 2.5870965300093434e+05, - "cpu_time": 4.2021406876154948e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0265498172119093e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2705, - "real_time": 2.5830442080912893e+05, - "cpu_time": 4.2014958447320986e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0297291016455986e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2705, - "real_time": 2.5865648216404396e+05, - "cpu_time": 4.2016348539743177e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0269664058428216e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5867121964658643e+05, - "cpu_time": 4.2048240695010114e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0268553688975770e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time_median", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5865648216404393e+05, - "cpu_time": 4.2016348539743171e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0269664058428216e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2864630726979959e+02, - "cpu_time": 7.8348997445575014e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3545163863424486e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6571086178641921e-03, - "cpu_time": 1.8633121422098574e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6550349066924283e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2225, - "real_time": 3.1464600667430693e+05, - "cpu_time": 5.6725122292133432e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3325577879823241e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2225, - "real_time": 3.1443056008213438e+05, - "cpu_time": 5.6701506651685690e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3348412435677209e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2225, - "real_time": 3.1449233844949538e+05, - "cpu_time": 5.6715783505616058e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3341861527364101e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2225, - "real_time": 3.1438448130194977e+05, - "cpu_time": 5.6701235730338597e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3353300253802853e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2225, - "real_time": 3.1451153013007611e+05, - "cpu_time": 5.6678037123595388e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3339826987148247e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1449298332759255e+05, - "cpu_time": 5.6704337060673838e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3341795816763134e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time_median", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1449233844949544e+05, - "cpu_time": 5.6701506651685701e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3341861527364101e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.9284812014469452e+01, - "cpu_time": 1.7835099523198230e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0524184086569371e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1569801959953147e-04, - "cpu_time": 3.1452796113487063e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1564538828104049e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1649, - "real_time": 4.2416253384132683e+05, - "cpu_time": 8.5380818617341702e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9442179180882454e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1649, - "real_time": 4.2408316128894582e+05, - "cpu_time": 8.5408612674347265e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9451432912968731e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1649, - "real_time": 4.2416476301118627e+05, - "cpu_time": 8.5393415767131362e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9441919340779676e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1649, - "real_time": 4.2464010833775013e+05, - "cpu_time": 8.5466491328075668e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9386573684932461e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1649, - "real_time": 4.2392578229927691e+05, - "cpu_time": 8.5333671255304420e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9469791354173479e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2419526975569717e+05, - "cpu_time": 8.5396601928440086e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9438379294747353e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time_median", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2416253384132683e+05, - "cpu_time": 8.5393415767131350e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9442179180882454e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6696229276346213e+02, - "cpu_time": 4.8084093918295366e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1096248564995746e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.2933821236906115e-04, - "cpu_time": 5.6306800074537469e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2899004798686042e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1044, - "real_time": 6.6672628073037823e+05, - "cpu_time": 1.4745809109195746e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2908934614145823e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1044, - "real_time": 6.6728751988897729e+05, - "cpu_time": 1.4764774109195257e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2856023452946405e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1044, - "real_time": 6.6700505584048398e+05, - "cpu_time": 1.4761133936781576e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2882641792194729e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1044, - "real_time": 6.6722942379274720e+05, - "cpu_time": 1.4775064568965379e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2861496367444696e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1044, - "real_time": 6.6660138950335269e+05, - "cpu_time": 1.4754460823754822e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2920720929263897e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6696993395118800e+05, - "cpu_time": 1.4760248509578556e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2885963431199112e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time_median", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6700505584048398e+05, - "cpu_time": 1.4761133936781574e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2882641792194729e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0191938262857093e+02, - "cpu_time": 1.0986062071809865e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8468542774086627e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5267315250625199e-04, - "cpu_time": 7.4430061693612679e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5270106746846399e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 598, - "real_time": 1.1606351495798316e+06, - "cpu_time": 2.7337277625417602e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2276012001159964e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 598, - "real_time": 1.1635309571546679e+06, - "cpu_time": 2.7393576739129676e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2096130733932018e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 598, - "real_time": 1.1668157896936487e+06, - "cpu_time": 2.7392314096989655e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.1893164920252371e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 598, - "real_time": 1.1601778768146266e+06, - "cpu_time": 2.7323264080268131e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2304498884530373e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 598, - "real_time": 1.1634501300745932e+06, - "cpu_time": 2.7397488963210629e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2101139388434067e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1629219806634737e+06, - "cpu_time": 2.7368784301003139e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2134189185661764e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time_median", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1634501300745935e+06, - "cpu_time": 2.7392314096989655e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2101139388434067e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6726038458359012e+03, - "cpu_time": 3.5556416517465696e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6564460138771804e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2981798351692684e-03, - "cpu_time": 1.2991595142266680e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2963396865995898e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 317, - "real_time": 2.1976045397483399e+06, - "cpu_time": 5.3835086687696734e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6343198680874825e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 317, - "real_time": 2.1975894138357993e+06, - "cpu_time": 5.3811649022081885e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6343724147797384e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 317, - "real_time": 2.1982839204700021e+06, - "cpu_time": 5.3839925583595941e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6319604777953167e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 317, - "real_time": 2.1966238761737896e+06, - "cpu_time": 5.3802529716088362e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6377281436199064e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 317, - "real_time": 2.1988583055885998e+06, - "cpu_time": 5.3847752996845124e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6299668593283930e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1977920111633064e+06, - "cpu_time": 5.3827388801261606e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6336695527221680e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time_median", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1976045397483399e+06, - "cpu_time": 5.3835086687696725e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6343198680874825e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3959649957903491e+02, - "cpu_time": 1.9344531483735889e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9163316284400853e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8201817793241991e-04, - "cpu_time": 3.5938082664865390e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8203535118966749e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 163, - "real_time": 4.4217865765551850e+06, - "cpu_time": 1.1309765760736244e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.5884331862395649e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 163, - "real_time": 4.8822770095173204e+06, - "cpu_time": 1.1995563981595309e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 6.8727013921148472e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 163, - "real_time": 4.8866854134969916e+06, - "cpu_time": 1.2000580901840601e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 6.8665013522914505e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 163, - "real_time": 4.2740082985327290e+06, - "cpu_time": 1.1127124319018632e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.8508111487568398e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 163, - "real_time": 4.8758200101234429e+06, - "cpu_time": 1.1993421398772992e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 6.8818028414364071e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6681154616451338e+06, - "cpu_time": 1.1685291272392757e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.2120499841678228e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time_median", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8758200101234429e+06, - "cpu_time": 1.1993421398772994e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 6.8818028414364071e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9697539777912595e+05, - "cpu_time": 4.3104252604589099e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7257397288442808e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.3617834695645276e-02, - "cpu_time": 3.6887615036542247e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5525609767242476e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 72, - "real_time": 9.5297634963774011e+06, - "cpu_time": 2.3918992972222477e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0420282754666929e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 72, - "real_time": 9.6299043701340761e+06, - "cpu_time": 2.4005008611110967e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 6.9687985903712206e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 72, - "real_time": 9.5515258273937628e+06, - "cpu_time": 2.3907776416666910e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0259836190288954e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 72, - "real_time": 9.5784481770048533e+06, - "cpu_time": 2.3946350555555619e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0062355362645702e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 72, - "real_time": 9.6147708827629685e+06, - "cpu_time": 2.3990949041666295e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 6.9797673619358387e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5808825507346131e+06, - "cpu_time": 2.3953815519444458e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0045626766134434e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time_median", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5784481770048551e+06, - "cpu_time": 2.3946350555555619e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0062355362645702e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1929878738253741e+04, - "cpu_time": 4.2975474321319489e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0656173218216263e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.3764108907731860e-03, - "cpu_time": 1.7940972404347959e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3766006007155706e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 40, - "real_time": 1.7557380674406886e+07, - "cpu_time": 4.4509099600000471e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6445188772176619e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 40, - "real_time": 1.7518852464854717e+07, - "cpu_time": 4.4459222525000542e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6613310300580273e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 40, - "real_time": 1.7530048685148358e+07, - "cpu_time": 4.4498557024999745e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6564378348652658e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 40, - "real_time": 1.7543380660936236e+07, - "cpu_time": 4.4501139649999291e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6506193757091522e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 40, - "real_time": 1.7529808264225721e+07, - "cpu_time": 4.4525308225000516e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6565428427364664e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7535894149914388e+07, - "cpu_time": 4.4498665405000113e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6538899921173143e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time_median", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7530048685148358e+07, - "cpu_time": 4.4501139649999291e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6564378348652658e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4826876563640169e+04, - "cpu_time": 2.4395628180141517e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4694066758799450e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.4551585661302338e-04, - "cpu_time": 5.4823280559331759e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4524427219920067e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 21, - "real_time": 3.3339728202138629e+07, - "cpu_time": 8.4895675190474719e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0515190277640238e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 21, - "real_time": 3.3311666299899418e+07, - "cpu_time": 8.4887485095239729e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0583016647477198e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 21, - "real_time": 3.3363812026523408e+07, - "cpu_time": 8.4950687857144669e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0457070009446287e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 21, - "real_time": 3.3308062702417374e+07, - "cpu_time": 8.4886244142856926e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0591734919640932e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 21, - "real_time": 3.3358089803230196e+07, - "cpu_time": 8.4935870523812205e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0470871558720474e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3336271806841802e+07, - "cpu_time": 8.4911192561905652e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0523576682585030e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time_median", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3339728202138625e+07, - "cpu_time": 8.4895675190474704e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0515190277640238e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5727513866816549e+04, - "cpu_time": 2.9975559035806760e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2148922235546447e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.7175738234580679e-04, - "cpu_time": 3.5302247125963606e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7181025478451580e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 7.5525252355469599e+07, - "cpu_time": 1.6435353066666874e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 7.1084954403481627e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 7.5278051197528839e+07, - "cpu_time": 1.6437984011110985e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 7.1318386097862206e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 7.5511722928947866e+07, - "cpu_time": 1.6449881855555761e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 7.1097690686406956e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 7.5517642001310989e+07, - "cpu_time": 1.6468346288888824e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 7.1092118049803505e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 7.5609767602549657e+07, - "cpu_time": 1.6481163755555725e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 7.1005496911737108e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5488487217161387e+07, - "cpu_time": 1.6454545795555633e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 7.1119729229858284e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time_median", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5517642001310989e+07, - "cpu_time": 1.6449881855555758e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 7.1092118049803505e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2423146277547846e+05, - "cpu_time": 1.9769770442651320e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1722940855659043e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6457007863741628e-03, - "cpu_time": 1.2014777368082154e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6483387918661235e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.3045530021190643e+08, - "cpu_time": 3.1546723899998599e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.2307259441038904e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.3058685064315796e+08, - "cpu_time": 3.1535474800000429e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.2224344848786526e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.3050521612167358e+08, - "cpu_time": 3.1538917440000206e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.2275778387196503e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.3070787787437439e+08, - "cpu_time": 3.1573372259999812e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.2148210303895521e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.3044191598892212e+08, - "cpu_time": 3.1551228539999557e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.2315704722643633e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3053943216800690e+08, - "cpu_time": 3.1549143387999719e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.2254259540712223e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time_median", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3050521612167358e+08, - "cpu_time": 3.1546723899998599e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.2275778387196503e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0997817604454902e+05, - "cpu_time": 1.4905035468942937e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.9261984502900289e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.4249007535902923e-04, - "cpu_time": 4.7243867402790824e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.4204738927372714e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3530, - "real_time": 1.9668310546915102e+05, - "cpu_time": 2.7396546005665092e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.2063444776176289e+06, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3530, - "real_time": 1.9706429648325217e+05, - "cpu_time": 2.7387645325778471e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1962735933093103e+06, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3530, - "real_time": 1.9690960134668462e+05, - "cpu_time": 2.7377090226627066e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.2003558637911044e+06, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3530, - "real_time": 1.9637951560179298e+05, - "cpu_time": 2.7384283371102950e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.2143931451404933e+06, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3530, - "real_time": 1.9695860437294282e+05, - "cpu_time": 2.7441066572239040e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1990620225001546e+06, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9679902465476474e+05, - "cpu_time": 2.7397326300282526e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.2032858204717375e+06, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time_median", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9690960134668462e+05, - "cpu_time": 2.7387645325778471e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.2003558637911044e+06, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7271190720852462e+02, - "cpu_time": 2.5432057508162106e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2167251942482108e+03, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3857381035649455e-03, - "cpu_time": 9.2826786195921059e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3869553669058163e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3539, - "real_time": 1.9638641767928025e+05, - "cpu_time": 2.7429041621928930e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0428419766506461e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3539, - "real_time": 1.9701137115918208e+05, - "cpu_time": 2.7488679570500483e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0395339050481752e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3539, - "real_time": 1.9671393534090047e+05, - "cpu_time": 2.7383441480643558e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0411057032898385e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3539, - "real_time": 1.9673793547874666e+05, - "cpu_time": 2.7392395818026422e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0409786983971084e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3539, - "real_time": 1.9640269274850999e+05, - "cpu_time": 2.7414950127153145e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0427555607001916e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9665047048132389e+05, - "cpu_time": 2.7421701723650505e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0414431688171921e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time_median", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9671393534090050e+05, - "cpu_time": 2.7414950127153145e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0411057032898385e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6126849243467962e+02, - "cpu_time": 4.1557708160544854e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3832877232848648e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3285932741233513e-03, - "cpu_time": 1.5155043468619749e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3282411990429769e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3540, - "real_time": 1.9684262669663009e+05, - "cpu_time": 2.7353188446327450e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0808501028147087e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3540, - "real_time": 1.9643182758081410e+05, - "cpu_time": 2.7422961920903443e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0852017977152217e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3540, - "real_time": 1.9658880946992655e+05, - "cpu_time": 2.7365484943505173e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0835367033577725e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3540, - "real_time": 1.9692200646106954e+05, - "cpu_time": 2.7429441045198299e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0800113068164162e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3540, - "real_time": 1.9693230659030718e+05, - "cpu_time": 2.7372395141244691e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0799025162088875e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9674351535974949e+05, - "cpu_time": 2.7388694299435813e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0819004853826012e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time_median", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9684262669663009e+05, - "cpu_time": 2.7372395141244691e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0808501028147087e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2271475192969683e+02, - "cpu_time": 3.4998462595569680e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3579680019961044e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1320055531307265e-03, - "cpu_time": 1.2778434127942572e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1326036083625624e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3553, - "real_time": 1.9802369437645859e+05, - "cpu_time": 2.7676271066701983e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1368786830258630e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3553, - "real_time": 1.9808641630523704e+05, - "cpu_time": 2.7639114635520079e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1355687849775180e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3553, - "real_time": 1.9750167506963463e+05, - "cpu_time": 2.7623976386150502e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1478129221494891e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3553, - "real_time": 1.9801531205143305e+05, - "cpu_time": 2.7629764762173843e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1370538041382313e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3553, - "real_time": 1.9807201198976126e+05, - "cpu_time": 2.7638331550803443e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1358695343708932e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9793982195850491e+05, - "cpu_time": 2.7641491680269968e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1386367457323991e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time_median", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9802369437645859e+05, - "cpu_time": 2.7638331550803443e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1368786830258630e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4681477855934185e+02, - "cpu_time": 2.0430055169456426e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1688621602099236e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2469182608999358e-03, - "cpu_time": 7.3910827265661120e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2489286878196915e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3529, - "real_time": 1.9912707443327556e+05, - "cpu_time": 2.7898604278832569e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2279117727358714e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3529, - "real_time": 1.9920950047682351e+05, - "cpu_time": 2.7911376905641000e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2245073456755906e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3529, - "real_time": 1.9918936674958019e+05, - "cpu_time": 2.7959012723150925e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2253386650894254e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3529, - "real_time": 1.9869735132526531e+05, - "cpu_time": 2.7894181326153030e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2457062918667585e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3529, - "real_time": 1.9919648557619928e+05, - "cpu_time": 2.7897698611504980e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2250447103056818e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9908395571222872e+05, - "cpu_time": 2.7912174769056501e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2297017571346670e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time_median", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9918936674958019e+05, - "cpu_time": 2.7898604278832569e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2253386650894254e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1843655892542134e+02, - "cpu_time": 2.6981066786571154e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0423412869676627e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0972082513829812e-03, - "cpu_time": 9.6664151073181238e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0987447119974287e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3495, - "real_time": 2.0121529091979633e+05, - "cpu_time": 2.8390338855509111e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6285044665448019e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3495, - "real_time": 2.0116300563023525e+05, - "cpu_time": 2.8331938454937097e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6289277393395090e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3495, - "real_time": 2.0112661177323110e+05, - "cpu_time": 2.8318385264662455e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6292224937864363e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3495, - "real_time": 2.0056704748491856e+05, - "cpu_time": 2.8313957367668865e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6337678801630640e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3495, - "real_time": 2.0128121140389002e+05, - "cpu_time": 2.8346976423462480e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6279711241526598e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0107063344241426e+05, - "cpu_time": 2.8340319273248006e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6296787407972944e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time_median", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0116300563023525e+05, - "cpu_time": 2.8331938454937097e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6289277393395090e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8746037761747255e+02, - "cpu_time": 3.0791903043202831e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3338862387657200e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4296487393311958e-03, - "cpu_time": 1.0865051570632450e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4321143059299549e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3407, - "real_time": 2.0399723476080384e+05, - "cpu_time": 2.9257396976813051e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.2125925666023844e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3407, - "real_time": 2.0463231177726528e+05, - "cpu_time": 2.9241858174346230e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.2026222755736399e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3407, - "real_time": 2.0432912032985786e+05, - "cpu_time": 2.9187778896391258e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.2073744503085142e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3407, - "real_time": 2.0376228476545273e+05, - "cpu_time": 2.9190366422071808e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.2162968763055128e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3407, - "real_time": 2.0432381706438315e+05, - "cpu_time": 2.9203612826535257e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.2074576983528733e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0420895373955258e+05, - "cpu_time": 2.9216202659231523e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.2092687734285849e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time_median", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0432381706438315e+05, - "cpu_time": 2.9203612826535257e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.2074576983528733e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3585849671780517e+02, - "cpu_time": 3.1579671420867442e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2793517086854519e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6446805615886850e-03, - "cpu_time": 1.0808958230883962e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6450325857392486e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3283, - "real_time": 2.1272753162151802e+05, - "cpu_time": 3.0821683307950053e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1614967748134053e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3283, - "real_time": 2.1323680371777111e+05, - "cpu_time": 3.0875369022236363e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1467813114231408e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3283, - "real_time": 2.1271897267521580e+05, - "cpu_time": 3.0817164605542854e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1617446883839428e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3283, - "real_time": 2.1288166804744248e+05, - "cpu_time": 3.0846159579650848e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1570355588715839e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3283, - "real_time": 2.1330697911223717e+05, - "cpu_time": 3.0875912214439083e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1447590953427243e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1297439103483694e+05, - "cpu_time": 3.0847257745963836e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1543634857669604e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time_median", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1288166804744248e+05, - "cpu_time": 3.0846159579650848e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1570355588715839e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8029043245922924e+02, - "cpu_time": 2.8161042977796944e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0969071645906870e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3160757549173186e-03, - "cpu_time": 9.1291884710502781e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3156368133465301e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3083, - "real_time": 2.2688800586721164e+05, - "cpu_time": 3.4165661141747772e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1553894133717330e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3083, - "real_time": 2.2694981788129351e+05, - "cpu_time": 3.4200863250082941e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1550747317061732e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3083, - "real_time": 2.2656691687120724e+05, - "cpu_time": 3.4169593058710865e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1570268228923144e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3083, - "real_time": 2.2677726053418769e+05, - "cpu_time": 3.4198099481027358e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1559536409536996e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3083, - "real_time": 2.2698309062070088e+05, - "cpu_time": 3.4160744437237305e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1549054129237080e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2683301835492020e+05, - "cpu_time": 3.4178992273761251e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1556700043695257e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time_median", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2688800586721167e+05, - "cpu_time": 3.4169593058710865e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1553894133717330e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6815645612262156e+02, - "cpu_time": 1.8989950216297598e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5718830267333915e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.4132265814807943e-04, - "cpu_time": 5.5560298747824488e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4172410760195960e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2747, - "real_time": 2.5546982365729535e+05, - "cpu_time": 4.1416743319986400e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0522502129383223e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2747, - "real_time": 2.5562510354777315e+05, - "cpu_time": 4.1454685584276251e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0510035701639025e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2747, - "real_time": 2.5537866577741693e+05, - "cpu_time": 4.1498147542771412e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0529827673896582e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2747, - "real_time": 2.5543738029207962e+05, - "cpu_time": 4.1458759191842470e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0525108713552554e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2747, - "real_time": 2.5543481619905887e+05, - "cpu_time": 4.1444508227156935e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0525314747674234e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5546915789472481e+05, - "cpu_time": 4.1454568773206696e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0522557793229122e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time_median", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5543738029207964e+05, - "cpu_time": 4.1454685584276251e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0525108713552554e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3136299797713761e+01, - "cpu_time": 2.9362654459155857e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4793889119365893e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.6456964341697131e-04, - "cpu_time": 7.0830924860889634e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6444720912927418e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2230, - "real_time": 3.1425165947716718e+05, - "cpu_time": 5.6103797443949885e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3367397382866874e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2230, - "real_time": 3.1398129922227160e+05, - "cpu_time": 5.6073545067260053e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3396129087856884e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2230, - "real_time": 3.1410083705883037e+05, - "cpu_time": 5.6107962645742204e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3383419471868649e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2230, - "real_time": 3.1423406652488117e+05, - "cpu_time": 5.6144110313900840e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3369265515868993e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2230, - "real_time": 3.1406016162369034e+05, - "cpu_time": 5.6097060313902353e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3387743118352370e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1412560478136817e+05, - "cpu_time": 5.6105295156951086e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3380790915362759e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time_median", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1410083705883042e+05, - "cpu_time": 5.6103797443949885e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3383419471868649e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1551415215967502e+02, - "cpu_time": 2.5455136435045000e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2275214014590541e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.6773236693033357e-04, - "cpu_time": 4.5370292347336982e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6773286905377519e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1662, - "real_time": 4.2087782538444409e+05, - "cpu_time": 8.4782421239469515e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9828046846715918e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1662, - "real_time": 4.2140422475487262e+05, - "cpu_time": 8.4898413898915774e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9765803872039871e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1662, - "real_time": 4.2089256953905313e+05, - "cpu_time": 8.4873277858001564e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9826301336151590e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1662, - "real_time": 4.2107652273352974e+05, - "cpu_time": 8.4885550541515916e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9804534016424904e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1662, - "real_time": 4.2125558082833013e+05, - "cpu_time": 8.4926418592062942e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9783364196061068e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2110134464804595e+05, - "cpu_time": 8.4873216425993142e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9801610053478670e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time_median", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2107652273352986e+05, - "cpu_time": 8.4885550541515904e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9804534016424904e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2895916296533704e+02, - "cpu_time": 5.4454759166843291e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7074466667766515e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.4371510771759651e-04, - "cpu_time": 6.4160121955936700e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4364641301140725e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1050, - "real_time": 6.6258198980774195e+05, - "cpu_time": 1.4673701304761944e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3302414863661470e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1050, - "real_time": 6.6279957941289817e+05, - "cpu_time": 1.4674667447618395e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3281633396859980e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1050, - "real_time": 6.6378458186851011e+05, - "cpu_time": 1.4704346961904471e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3187728587990227e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1050, - "real_time": 6.6272736726594821e+05, - "cpu_time": 1.4686691933333611e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3288528694739304e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1050, - "real_time": 6.6254282791522285e+05, - "cpu_time": 1.4677984666666687e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3306156572518082e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6288726925406430e+05, - "cpu_time": 1.4683478462857022e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3273292423153811e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time_median", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6272736726594833e+05, - "cpu_time": 1.4677984666666687e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3288528694739304e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1241181155015920e+02, - "cpu_time": 1.2739988729012086e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8864748431727346e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.7299992821821335e-04, - "cpu_time": 8.6764105393955914e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7228079273848724e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 603, - "real_time": 1.1583966578343022e+06, - "cpu_time": 2.7266371409618985e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2415678543850842e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 603, - "real_time": 1.1510806124206404e+06, - "cpu_time": 2.7235302437811908e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2875938570100279e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 603, - "real_time": 1.1631329308355083e+06, - "cpu_time": 2.7425624212272284e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2120802168108578e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 603, - "real_time": 1.1497886820926422e+06, - "cpu_time": 2.7178159519070946e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2957823734466906e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 603, - "real_time": 1.1519071621709126e+06, - "cpu_time": 2.7209053814262622e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2823646518445301e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1548612090708013e+06, - "cpu_time": 2.7262902278607348e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2638777906994390e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time_median", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1519071621709128e+06, - "cpu_time": 2.7235302437811913e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2823646518445301e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.6936502565237206e+03, - "cpu_time": 9.6609013791964098e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5717083292125635e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.9301597558245279e-03, - "cpu_time": 3.5436070893952931e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9170820767190293e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 318, - "real_time": 2.1999196256305906e+06, - "cpu_time": 5.3880467201258345e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6262858899633369e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 318, - "real_time": 2.1890364924106020e+06, - "cpu_time": 5.3610288899368392e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6642011488463860e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 318, - "real_time": 2.1883734778659241e+06, - "cpu_time": 5.3655296981134089e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6665231824875441e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 318, - "real_time": 2.1883094399206857e+06, - "cpu_time": 5.3615608836479103e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6667475330216932e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 318, - "real_time": 2.1988901634753314e+06, - "cpu_time": 5.3844032264152914e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6298563150983953e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1929058398606270e+06, - "cpu_time": 5.3721138836478572e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6507228138834724e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time_median", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1890364924106020e+06, - "cpu_time": 5.3655296981134098e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6642011488463860e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.9507639698196563e+03, - "cpu_time": 1.3062136287914582e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0740556929409586e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7136431768533501e-03, - "cpu_time": 2.4314704734153783e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7109277690432719e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 151, - "real_time": 4.4291940893953210e+06, - "cpu_time": 1.1333258523178447e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.5757420701744165e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 151, - "real_time": 4.4124565697861034e+06, - "cpu_time": 1.1305205417218816e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6044787000875959e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 151, - "real_time": 4.6438055100622559e+06, - "cpu_time": 1.1635631834437182e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.2256324962993908e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 151, - "real_time": 4.5481205375137310e+06, - "cpu_time": 1.1502553304635150e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.3776479148335886e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 151, - "real_time": 4.3839444714715546e+06, - "cpu_time": 1.1273503668873660e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.6539363621859055e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4835042356457943e+06, - "cpu_time": 1.1410030549668651e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.4874875087161789e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time_median", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.4291940893953210e+06, - "cpu_time": 1.1333258523178447e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.5757420701744165e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0929464133581097e+05, - "cpu_time": 1.5409270058957548e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8014841881781811e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4377057674412662e-02, - "cpu_time": 1.3505020860268453e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4059929129512065e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 73, - "real_time": 9.5608487903867681e+06, - "cpu_time": 2.3934927767122459e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0191324506121826e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 73, - "real_time": 9.5420455151837170e+06, - "cpu_time": 2.3923805273972765e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0329641472798958e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 73, - "real_time": 9.5218195490641128e+06, - "cpu_time": 2.3893003643836092e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0479033607180719e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 73, - "real_time": 9.6007373745310791e+06, - "cpu_time": 2.4009589863012854e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 6.9899697681583271e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 73, - "real_time": 9.5614339671518710e+06, - "cpu_time": 2.3931863123288140e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0187028672217226e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5573770392635092e+06, - "cpu_time": 2.3938637934246462e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0217345187980413e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time_median", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5608487903867681e+06, - "cpu_time": 2.3931863123288143e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0191324506121826e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9189129544120813e+04, - "cpu_time": 4.3000976360138782e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1423549522254243e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0540941750237913e-03, - "cpu_time": 1.7963000433964479e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0510338243208688e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 40, - "real_time": 1.7299412097781897e+07, - "cpu_time": 4.4177811525000267e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7585138293346500e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 40, - "real_time": 1.7305688327178359e+07, - "cpu_time": 4.4229356424997941e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7557000601480150e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 40, - "real_time": 1.7284279828891158e+07, - "cpu_time": 4.4154647050001472e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7653063551801157e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 40, - "real_time": 1.7170606972649693e+07, - "cpu_time": 4.4104581150000401e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8167142381040773e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 40, - "real_time": 1.7154122889041901e+07, - "cpu_time": 4.4113181525000297e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8242256318298063e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7242822023108605e+07, - "cpu_time": 4.4155915535000078e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7840920229193335e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time_median", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7284279828891158e+07, - "cpu_time": 4.4154647050001472e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7653063551801157e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4087631045894348e+04, - "cpu_time": 5.0833115311385118e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3496881710143708e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2967230623040175e-03, - "cpu_time": 1.1512186916630086e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3032484214621464e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 17, - "real_time": 4.1273444233571783e+07, - "cpu_time": 8.4211814588236257e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.5038297865544949e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 17, - "real_time": 4.1263732182628967e+07, - "cpu_time": 8.4346212529413506e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.5053605624409523e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 17, - "real_time": 4.1144775117144868e+07, - "cpu_time": 8.4330694588235185e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.5241687489049854e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 17, - "real_time": 4.1191807564567119e+07, - "cpu_time": 8.4200293000000834e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.5167195098014135e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 17, - "real_time": 4.1226329172358796e+07, - "cpu_time": 8.4226497352942184e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.5112626175793295e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1220017654054306e+07, - "cpu_time": 8.4263102411765605e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.5122682450562363e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time_median", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1226329172358796e+07, - "cpu_time": 8.4226497352942199e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.5112626175793295e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3062329340356271e+04, - "cpu_time": 6.9626480878010625e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.3870539708004743e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2872951628912558e-03, - "cpu_time": 8.2629856823653730e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2878852122173367e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 6.6880545020103455e+07, - "cpu_time": 1.5970405499999744e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.0273106602020559e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 6.7158274352550507e+07, - "cpu_time": 1.6032483320000210e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 7.9941141605525923e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 6.7085506021976471e+07, - "cpu_time": 1.6001286309999615e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.0027854574746294e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 6.6980416327714920e+07, - "cpu_time": 1.5986131290000004e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.0153415197250042e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 6.7162881046533585e+07, - "cpu_time": 1.6028053410000211e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 7.9935658452178478e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7053524553775787e+07, - "cpu_time": 1.6003671965999955e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.0066235286344271e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time_median", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7085506021976471e+07, - "cpu_time": 1.6001286309999615e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.0027854574746294e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2167673251917050e+05, - "cpu_time": 2.6667270952398289e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4540279891754491e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8146209812071523e-03, - "cpu_time": 1.6663220171628929e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8160314194558382e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.2794494628906250e+08, - "cpu_time": 3.1568932760001189e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.3922175524942160e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.2781183123588562e+08, - "cpu_time": 3.1634968599998957e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.4009579834462652e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.2740846574306488e+08, - "cpu_time": 3.1567537119999540e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.4275547761899500e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.2759979367256165e+08, - "cpu_time": 3.1546237360000759e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.4149181836090345e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.2755151093006134e+08, - "cpu_time": 3.1573488279998404e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.4181035267292986e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2766330957412723e+08, - "cpu_time": 3.1578232823999774e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.4107504044937534e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time_median", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2759979367256165e+08, - "cpu_time": 3.1568932760001189e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.4149181836090345e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1380862236523614e+05, - "cpu_time": 3.3414285740206449e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4081759572962465e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6747852071083036e-03, - "cpu_time": 1.0581429912952969e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6742572179337014e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3485, - "real_time": 2.0080205338116511e+05, - "cpu_time": 2.7915876499282679e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.0995494456235943e+06, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3485, - "real_time": 2.0015158207313434e+05, - "cpu_time": 2.7884251621234836e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1161224377723671e+06, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3485, - "real_time": 2.0005874890033048e+05, - "cpu_time": 2.7886665595407656e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1184964698052676e+06, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3485, - "real_time": 2.0041809518106008e+05, - "cpu_time": 2.7892468436157668e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1093190915466305e+06, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3485, - "real_time": 2.0010823854014755e+05, - "cpu_time": 2.7937294863699772e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1172305921555338e+06, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0030774361516754e+05, - "cpu_time": 2.7903311403156526e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1121436073806789e+06, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time_median", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0015158207313437e+05, - "cpu_time": 2.7892468436157668e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1161224377723671e+06, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0931645731510372e+02, - "cpu_time": 2.2752391998057828e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8844493534073326e+03, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5442061886002988e-03, - "cpu_time": 8.1540114251400255e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5422980962475556e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3495, - "real_time": 2.0056898515466307e+05, - "cpu_time": 2.7918096652361710e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0210950603458172e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3495, - "real_time": 2.0025374459599721e+05, - "cpu_time": 2.7934071359086299e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0227024738697128e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3495, - "real_time": 1.9992279693736121e+05, - "cpu_time": 2.7882306723891082e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0243954323236428e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3495, - "real_time": 2.0041635651950815e+05, - "cpu_time": 2.7895563118743431e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0218726832311470e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3495, - "real_time": 2.0061481456093767e+05, - "cpu_time": 2.7956992217453435e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0208617965139911e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0035533955369348e+05, - "cpu_time": 2.7917406014307193e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0221854892568622e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time_median", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0041635651950815e+05, - "cpu_time": 2.7918096652361716e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0218726832311470e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8022733748810202e+02, - "cpu_time": 2.9809186717114102e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4309233685014155e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3986517060754627e-03, - "cpu_time": 1.0677634842519899e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3998666421509362e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3516, - "real_time": 2.0052282208461841e+05, - "cpu_time": 2.7935471217293770e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0426602605221331e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3516, - "real_time": 2.0026916875946309e+05, - "cpu_time": 2.7959864306029293e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0452474164505944e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3516, - "real_time": 2.0050198201200552e+05, - "cpu_time": 2.8039524032991909e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0428725735762265e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3516, - "real_time": 2.0068300612399564e+05, - "cpu_time": 2.8005026734925807e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0410298206661366e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3516, - "real_time": 2.0065711368104725e+05, - "cpu_time": 2.7968735836177942e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0412931915839080e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0052681853222597e+05, - "cpu_time": 2.7981724425483739e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0426206525597997e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time_median", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0052282208461844e+05, - "cpu_time": 2.7968735836177936e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0426602605221331e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6461137519889937e+02, - "cpu_time": 4.0834176239186797e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6776337716781334e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.2089456364882810e-04, - "cpu_time": 1.4593159312939973e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2131440782983031e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3476, - "real_time": 2.0126281829782086e+05, - "cpu_time": 2.8160167894131865e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0702997549591094e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3476, - "real_time": 2.0141665820257820e+05, - "cpu_time": 2.8146527502876078e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0671909032274567e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3476, - "real_time": 2.0093651105719697e+05, - "cpu_time": 2.8105014729575254e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0769096451904304e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3476, - "real_time": 2.0099372598528137e+05, - "cpu_time": 2.8110332278478646e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0757491109945856e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3476, - "real_time": 2.0159106222839392e+05, - "cpu_time": 2.8123433515535283e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0636722230863690e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0124015515425432e+05, - "cpu_time": 2.8129095184119430e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0707643274915904e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time_median", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0126281829782089e+05, - "cpu_time": 2.8123433515535283e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0702997549591094e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7736699145763038e+02, - "cpu_time": 2.3629263926964830e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6101722277484492e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3782884993555260e-03, - "cpu_time": 8.4002929252786560e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3781618822442231e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3457, - "real_time": 2.0237318604472259e+05, - "cpu_time": 2.8463804483657709e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0959342095742315e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3457, - "real_time": 2.0290757513946932e+05, - "cpu_time": 2.8462026468036254e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0746122902205080e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3457, - "real_time": 2.0238110452601060e+05, - "cpu_time": 2.8397510992191563e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0956174433242515e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3457, - "real_time": 2.0241456371480838e+05, - "cpu_time": 2.8403203210878582e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0942792353045329e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3457, - "real_time": 2.0276386614104678e+05, - "cpu_time": 2.8382572779868642e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0803351759938076e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0256805911321155e+05, - "cpu_time": 2.8421823586926551e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0881556708834663e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time_median", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0241456371480841e+05, - "cpu_time": 2.8403203210878582e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0942792353045329e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5004994102858387e+02, - "cpu_time": 3.8265891671733482e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9782896016802406e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2343996488056175e-03, - "cpu_time": 1.3463559632160616e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2336915865258458e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3422, - "real_time": 2.0444459151022119e+05, - "cpu_time": 2.8828863559322560e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6027814557452729e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3422, - "real_time": 2.0497547109237252e+05, - "cpu_time": 2.8832005581529310e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.5986303056346214e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3422, - "real_time": 2.0444487397556810e+05, - "cpu_time": 2.8804225482172763e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6027792413086325e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3422, - "real_time": 2.0419870614440084e+05, - "cpu_time": 2.8766496960844134e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6047114410621107e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3422, - "real_time": 2.0478942960192225e+05, - "cpu_time": 2.8789291057861352e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6000825854974899e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0457061446489699e+05, - "cpu_time": 2.8804176528346026e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6017970058496255e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time_median", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0444487397556810e+05, - "cpu_time": 2.8804225482172763e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6027792413086325e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0894870431733710e+02, - "cpu_time": 2.7501068772168685e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4184234584745494e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5102301233511264e-03, - "cpu_time": 9.5475976357473850e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5098189406289773e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3389, - "real_time": 2.0812254914119135e+05, - "cpu_time": 2.9744247831220750e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1489139581670249e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3389, - "real_time": 2.0783879797976173e+05, - "cpu_time": 2.9766378164651175e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1532130014715326e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3389, - "real_time": 2.0772479453161065e+05, - "cpu_time": 2.9745983771024022e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1549435467140162e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3389, - "real_time": 2.0801358668859248e+05, - "cpu_time": 2.9722781616993988e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1505634340179384e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3389, - "real_time": 2.0779892602831282e+05, - "cpu_time": 2.9757170345234947e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1538180322967911e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0789973087389380e+05, - "cpu_time": 2.9747312345824979e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1522903945334607e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time_median", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0783879797976173e+05, - "cpu_time": 2.9745983771024027e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1532130014715326e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6362173228015962e+02, - "cpu_time": 1.6382907382248715e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4802627054406959e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.8702233808762350e-04, - "cpu_time": 5.5073571661838042e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8681288682725401e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3246, - "real_time": 2.1551860806197091e+05, - "cpu_time": 3.1574684134318231e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0817022334475708e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3246, - "real_time": 2.1515833288791962e+05, - "cpu_time": 3.1535826032038755e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0918858331309938e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3246, - "real_time": 2.1541775726872907e+05, - "cpu_time": 3.1567870271103596e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0845494662025690e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3246, - "real_time": 2.1549578497441081e+05, - "cpu_time": 3.1566859981514903e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0823463445266092e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3246, - "real_time": 2.1539379650024261e+05, - "cpu_time": 3.1559326956252963e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0852263217270684e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1539685593865463e+05, - "cpu_time": 3.1560913475045690e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0851420398069632e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time_median", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1541775726872907e+05, - "cpu_time": 3.1566859981514903e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.0845494662025690e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4313455656255158e+02, - "cpu_time": 1.5043984236305081e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0461455475551047e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.6451553314834152e-04, - "cpu_time": 4.7666504482514211e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6492212031971879e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3050, - "real_time": 2.2962554130363508e+05, - "cpu_time": 3.4656053868852946e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1416151640263989e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3050, - "real_time": 2.2983291027991130e+05, - "cpu_time": 3.4701554065573780e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1405851306531224e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3050, - "real_time": 2.2918744806150647e+05, - "cpu_time": 3.4641590786886960e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1437973685611660e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3050, - "real_time": 2.2949039910778738e+05, - "cpu_time": 3.4704308163934940e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1422874378151035e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3050, - "real_time": 2.2972175167285700e+05, - "cpu_time": 3.4764188360653503e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1411370411858735e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2957161008513946e+05, - "cpu_time": 3.4693539049180422e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1418844284483330e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time_median", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2962554130363511e+05, - "cpu_time": 3.4701554065573786e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1416151640263989e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4895006915869664e+02, - "cpu_time": 4.8154180069977173e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2390542998916553e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0844113915756850e-03, - "cpu_time": 1.3879869678822729e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0850960649103193e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2710, - "real_time": 2.5812380600718924e+05, - "cpu_time": 4.1796564981547993e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0311493469354684e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2710, - "real_time": 2.5820899733283810e+05, - "cpu_time": 4.1796571439115598e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0304792064398098e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2710, - "real_time": 2.5809917681011959e+05, - "cpu_time": 4.1858128929888859e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0313431700160449e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2710, - "real_time": 2.5774983848561964e+05, - "cpu_time": 4.1779969151291618e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0340963279759769e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2710, - "real_time": 2.5865051351320959e+05, - "cpu_time": 4.1925271992619196e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0270131803671210e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5816646642979528e+05, - "cpu_time": 4.1831301298892649e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0308162463468843e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time_median", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5812380600718927e+05, - "cpu_time": 4.1796571439115598e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0311493469354684e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2250469184838448e+02, - "cpu_time": 6.0411044816443518e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5359636628311533e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2492121703811022e-03, - "cpu_time": 1.4441588700479348e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2487410751184154e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2224, - "real_time": 3.1490143189441646e+05, - "cpu_time": 5.6572234262590285e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3298546586208534e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2224, - "real_time": 3.1543302113094396e+05, - "cpu_time": 5.6683844244603219e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3242429604879904e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2224, - "real_time": 3.1513107468716620e+05, - "cpu_time": 5.6651856205036410e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3274281219042964e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2224, - "real_time": 3.1461373595016246e+05, - "cpu_time": 5.6564868165468413e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3328996168371472e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2224, - "real_time": 3.1456553881607694e+05, - "cpu_time": 5.6524666456834564e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3334102773828983e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1492896049575321e+05, - "cpu_time": 5.6599493866906583e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3295671270466371e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time_median", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1490143189441646e+05, - "cpu_time": 5.6572234262590273e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3298546586208534e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6301753594029549e+02, - "cpu_time": 6.5950677015003203e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8366671626712685e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1526965807426618e-03, - "cpu_time": 1.1652167273807409e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1523020910151869e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1651, - "real_time": 4.2469156237554905e+05, - "cpu_time": 8.5358081284072774e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9380590192783642e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1651, - "real_time": 4.2500264581554040e+05, - "cpu_time": 8.5431956753480446e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9344445749879065e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1651, - "real_time": 4.2430895078108774e+05, - "cpu_time": 8.5278771168985555e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9425118092358513e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1651, - "real_time": 4.2456032932585932e+05, - "cpu_time": 8.5325266020593152e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9395853902082081e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1651, - "real_time": 4.2404651717011502e+05, - "cpu_time": 8.5168798667474079e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9455706274759569e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2452200109363039e+05, - "cpu_time": 8.5312574778921215e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9400342842372570e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time_median", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2456032932585932e+05, - "cpu_time": 8.5325266020593140e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9395853902082081e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6493657924141343e+02, - "cpu_time": 9.7849654754979497e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2466826353566851e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.5964114533824813e-04, - "cpu_time": 1.1469546547920612e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5964638927852591e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1049, - "real_time": 6.6632616768251068e+05, - "cpu_time": 1.4739079485223831e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2946709936183844e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1049, - "real_time": 6.6593523570971203e+05, - "cpu_time": 1.4727608303145808e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2983662300583544e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1049, - "real_time": 6.6593890018438001e+05, - "cpu_time": 1.4748718674927771e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2983315719185562e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1049, - "real_time": 6.6587864837473398e+05, - "cpu_time": 1.4727349580553537e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2989014743713303e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1049, - "real_time": 6.6618250035507709e+05, - "cpu_time": 1.4732616167777826e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2960284873355646e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6605229046128283e+05, - "cpu_time": 1.4735074442325756e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2972597514604378e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time_median", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6593890018437989e+05, - "cpu_time": 1.4732616167777828e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2983315719185562e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9279139800689853e+02, - "cpu_time": 8.9953500359016778e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8225001159506135e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8945384734489613e-04, - "cpu_time": 6.1047197766866989e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8941161519150386e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 607, - "real_time": 1.1526906170116668e+06, - "cpu_time": 2.7282133822076432e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2774150116250114e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 607, - "real_time": 1.1496033540219560e+06, - "cpu_time": 2.7213565436573634e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2969585297850380e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 607, - "real_time": 1.1531745545455613e+06, - "cpu_time": 2.7282364102141834e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2743609949889603e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 607, - "real_time": 1.1487765632005166e+06, - "cpu_time": 2.7196201285008141e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3022102545591240e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 607, - "real_time": 1.1508957831161418e+06, - "cpu_time": 2.7230905337725249e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2887642157200165e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1510281743791683e+06, - "cpu_time": 2.7241033996705059e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2879418013356295e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time_median", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1508957831161418e+06, - "cpu_time": 2.7230905337725254e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2887642157200165e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9031590002849614e+03, - "cpu_time": 3.9574160845692904e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2050084205382135e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6534425852012449e-03, - "cpu_time": 1.4527407752025713e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6534276115066902e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 319, - "real_time": 2.1886931532310750e+06, - "cpu_time": 5.4131615768024223e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6654034281747112e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 319, - "real_time": 2.1891596210320541e+06, - "cpu_time": 5.4138807711599907e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6637700781684313e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 319, - "real_time": 2.1886846151343053e+06, - "cpu_time": 5.4145269749215655e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6654333310468721e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 319, - "real_time": 2.1871623603574536e+06, - "cpu_time": 5.4118039498432949e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6707684368059702e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 319, - "real_time": 2.1881013167116991e+06, - "cpu_time": 5.4135445830718856e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6674767625536518e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1883602132933172e+06, - "cpu_time": 5.4133835711598312e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6665704073499269e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time_median", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1886846151343053e+06, - "cpu_time": 5.4135445830718856e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6654333310468721e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6762904183569867e+02, - "cpu_time": 1.0155035497814446e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6898679128908915e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.5077819326667192e-04, - "cpu_time": 1.8759127936021543e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5085674166797191e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 167, - "real_time": 4.1918629769258155e+06, - "cpu_time": 1.1019270419161374e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 8.0046585932557831e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 167, - "real_time": 4.1967569487894364e+06, - "cpu_time": 1.1025201538922386e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.9953241060764427e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 167, - "real_time": 4.1942400551083204e+06, - "cpu_time": 1.1025457227545107e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 8.0001219670611877e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 167, - "real_time": 4.1903425509968917e+06, - "cpu_time": 1.1009973988023888e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 8.0075630074723425e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 167, - "real_time": 4.1937408522663717e+06, - "cpu_time": 1.1016616994011801e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 8.0010742632956429e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1933886768173673e+06, - "cpu_time": 1.1019304033532912e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 8.0017483874322805e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time_median", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1937408522663713e+06, - "cpu_time": 1.1019270419161374e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 8.0010742632956429e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4393017082159140e+03, - "cpu_time": 6.4597489656612015e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6543039660082366e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.8170179208554950e-04, - "cpu_time": 5.8622113937536352e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8166087468063696e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 77, - "real_time": 8.9965790219895244e+06, - "cpu_time": 2.3020430675324127e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.4593758178494148e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 77, - "real_time": 8.9818630004664529e+06, - "cpu_time": 2.3004991337662525e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.4715973731190128e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 77, - "real_time": 8.9831992064590584e+06, - "cpu_time": 2.2994010857143044e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.4704860103455906e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 77, - "real_time": 8.9640903782534916e+06, - "cpu_time": 2.2965188883116245e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.4864109093325634e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 77, - "real_time": 8.9814930476925597e+06, - "cpu_time": 2.2992058999999575e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.4719051324368591e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9814449309722167e+06, - "cpu_time": 2.2995336150649101e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.4719550486166887e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time_median", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9818630004664510e+06, - "cpu_time": 2.2994010857143041e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.4715973731190128e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1548547427738880e+04, - "cpu_time": 2.0275056497050733e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6111582619370073e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2858228844574990e-03, - "cpu_time": 8.8170298377997062e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2862976556204467e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 34, - "real_time": 2.0327668089200467e+07, - "cpu_time": 4.3194174794116274e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 6.6027115068504190e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 34, - "real_time": 2.0321945605032586e+07, - "cpu_time": 4.3086795499999985e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 6.6045707733201466e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 34, - "real_time": 2.0332195467370398e+07, - "cpu_time": 4.3084213852941558e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 6.6012412784146147e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 34, - "real_time": 2.0321625777903724e+07, - "cpu_time": 4.3039923999996893e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 6.6046747178042574e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 34, - "real_time": 2.0316670758321006e+07, - "cpu_time": 4.3113545323528931e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 6.6062855276142654e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0324021139565639e+07, - "cpu_time": 4.3103730694116727e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 6.6038967608007412e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time_median", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0321945605032586e+07, - "cpu_time": 4.3086795499999985e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 6.6045707733201466e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.0040316139966862e+03, - "cpu_time": 5.7042668843939566e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9507774400992030e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9541553675657136e-04, - "cpu_time": 1.3233812462484914e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9539793106375965e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 21, - "real_time": 3.2818753804479327e+07, - "cpu_time": 8.1138945238097087e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1793311714158421e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 21, - "real_time": 3.2742319362504143e+07, - "cpu_time": 8.0994951285717994e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1984251948689680e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 21, - "real_time": 3.2775835976714179e+07, - "cpu_time": 8.1025270571428463e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1900414741735907e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 21, - "real_time": 3.2792750213827405e+07, - "cpu_time": 8.1042634571428522e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1858171165775347e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 21, - "real_time": 3.2716170308135804e+07, - "cpu_time": 8.0899429238094121e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.2049779504065580e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2769165933132172e+07, - "cpu_time": 8.1020246180953234e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1917185814884987e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time_median", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2775835976714183e+07, - "cpu_time": 8.1025270571428463e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.1900414741735907e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0586141062192684e+04, - "cpu_time": 8.6389403445088828e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0147381836276785e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2385466613648822e-03, - "cpu_time": 1.0662693279423509e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2387366259392332e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 6.4500274509191513e+07, - "cpu_time": 1.6061778570000345e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.3235446063643351e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 6.4820358902215958e+07, - "cpu_time": 1.6100060370000619e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2824427555220842e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 6.4877221733331680e+07, - "cpu_time": 1.6117376739999825e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2751834566333504e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 6.4562387019395828e+07, - "cpu_time": 1.6072487260000798e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.3155369060117502e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 6.4806582033634186e+07, - "cpu_time": 1.6079729230000338e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2842034736744423e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4713364839553833e+07, - "cpu_time": 1.6086286434000385e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2961822396411934e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time_median", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4806582033634186e+07, - "cpu_time": 1.6079729230000338e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2842034736744423e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6969682335781684e+05, - "cpu_time": 2.2306826115188195e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1774499814423293e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6222840332681243e-03, - "cpu_time": 1.3866983039690203e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6246409716483075e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6, - "real_time": 1.2326131264368694e+08, - "cpu_time": 3.1474746216667885e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.7111016503927670e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6, - "real_time": 1.2375142176946004e+08, - "cpu_time": 3.1616556033333153e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.6766019222009697e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6, - "real_time": 1.2354011585315068e+08, - "cpu_time": 3.1582175049999249e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.6914425859559040e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6, - "real_time": 1.2384483839074771e+08, - "cpu_time": 3.1626188733334476e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.6700571291650848e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6, - "real_time": 1.2376265103618304e+08, - "cpu_time": 3.1630171233335131e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.6758146743809052e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2363206793864569e+08, - "cpu_time": 3.1585967453333986e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.6850035924191265e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time_median", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2375142176946005e+08, - "cpu_time": 3.1616556033333153e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 8.6766019222009697e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3584063599124807e+05, - "cpu_time": 6.4984483851287910e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6590587005600495e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9076008346660318e-03, - "cpu_time": 2.0573846264895276e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9102567810198616e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3533, - "real_time": 1.9760566381910254e+05, - "cpu_time": 2.7412819869797578e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1820377018009843e+06, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3533, - "real_time": 1.9766082432214750e+05, - "cpu_time": 2.7443727285593329e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1805915689751720e+06, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3533, - "real_time": 1.9805392259331868e+05, - "cpu_time": 2.7457003679591056e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1703091087100971e+06, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3533, - "real_time": 1.9789545625236552e+05, - "cpu_time": 2.7387987461080035e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1744492743388079e+06, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3533, - "real_time": 1.9760063805383706e+05, - "cpu_time": 2.7399639796205657e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1821695015023546e+06, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9776330100815426e+05, - "cpu_time": 2.7420235618453531e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1779114310654830e+06, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time_median", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9766082432214750e+05, - "cpu_time": 2.7412819869797578e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1805915689751720e+06, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0232159149286338e+02, - "cpu_time": 2.9252664928209026e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2943896635192696e+03, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0230492232960915e-03, - "cpu_time": 1.0668276281521917e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0224952153014750e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3537, - "real_time": 1.9811669761081433e+05, - "cpu_time": 2.7447950918859348e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0337341701622471e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3537, - "real_time": 1.9756897623448772e+05, - "cpu_time": 2.7406041899916314e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0365999961296050e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3537, - "real_time": 1.9769097690804655e+05, - "cpu_time": 2.7421216284986178e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0359602810565306e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3537, - "real_time": 1.9811221673998560e+05, - "cpu_time": 2.7415167514844035e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0337575509984417e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3537, - "real_time": 1.9757702536082486e+05, - "cpu_time": 2.7395979474129650e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0365577658940060e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9781317857083183e+05, - "cpu_time": 2.7417271218547103e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0353219528481662e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time_median", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9769097690804658e+05, - "cpu_time": 2.7415167514844035e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0359602810565306e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7923287783682753e+02, - "cpu_time": 1.9625679013961866e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4608643348657713e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4115989634979824e-03, - "cpu_time": 7.1581445350715929e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4110242044486161e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3569, - "real_time": 1.9819057637822477e+05, - "cpu_time": 2.7451357747270889e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0666976578055043e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3569, - "real_time": 1.9755066497399218e+05, - "cpu_time": 2.7414452255532856e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0733921602031782e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3569, - "real_time": 1.9798884056793628e+05, - "cpu_time": 2.7453280190530908e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0688034680391658e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3569, - "real_time": 1.9751595916583613e+05, - "cpu_time": 2.7407670411880658e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0737564788681012e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3569, - "real_time": 1.9820469868373053e+05, - "cpu_time": 2.7430939030538342e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0665504032958712e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9789014795394399e+05, - "cpu_time": 2.7431539927150740e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0698400336423643e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time_median", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9798884056793628e+05, - "cpu_time": 2.7430939030538348e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0688034680391658e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3697387680762932e+02, - "cpu_time": 2.0781532683828590e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5258618901979127e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7028330126169545e-03, - "cpu_time": 7.5757805573502593e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7034465624830629e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3517, - "real_time": 1.9868515928276279e+05, - "cpu_time": 2.7642067728175706e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1231061391663328e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3517, - "real_time": 1.9922799084537217e+05, - "cpu_time": 2.7633151862381212e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1118720141880564e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3517, - "real_time": 1.9860112896485149e+05, - "cpu_time": 2.7602036479952384e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1248506706373379e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3517, - "real_time": 1.9866819189855989e+05, - "cpu_time": 2.7631599346032692e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1234582756875552e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3517, - "real_time": 1.9917812674869178e+05, - "cpu_time": 2.7660437873190182e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1129014183048621e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9887211954804760e+05, - "cpu_time": 2.7633858657946438e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1192377035968296e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time_median", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9868515928276282e+05, - "cpu_time": 2.7633151862381212e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1231061391663328e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0424550542816507e+02, - "cpu_time": 2.1166592656160023e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2985179457154838e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5298549948559240e-03, - "cpu_time": 7.6596587245239176e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5290494015957742e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3501, - "real_time": 1.9975052384178957e+05, - "cpu_time": 2.7869916423879215e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2022313057745904e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3501, - "real_time": 2.0027814846018597e+05, - "cpu_time": 2.7881212510711385e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1806228617382273e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3501, - "real_time": 2.0033897699958997e+05, - "cpu_time": 2.7925116680948326e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1781389949063852e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3501, - "real_time": 1.9996984720320415e+05, - "cpu_time": 2.7894291116826539e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1932352447871834e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3501, - "real_time": 1.9982113045770902e+05, - "cpu_time": 2.7871382005141809e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1993330547529742e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0003172539249572e+05, - "cpu_time": 2.7888383747501456e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1907122923918724e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time_median", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9996984720320418e+05, - "cpu_time": 2.7881212510711385e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.1932352447871834e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6569782054409461e+02, - "cpu_time": 2.2725169600671788e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0877211525708232e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3282784019522454e-03, - "cpu_time": 8.1486147804129216e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3279933585033593e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3462, - "real_time": 2.0244368031702490e+05, - "cpu_time": 2.8407116637782584e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6186230140000230e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3462, - "real_time": 2.0202921817805117e+05, - "cpu_time": 2.8356010774119297e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6219436126868096e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3462, - "real_time": 2.0243250794329689e+05, - "cpu_time": 2.8350825621029967e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6187123467925715e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3462, - "real_time": 2.0199603106000539e+05, - "cpu_time": 2.8360905805892509e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6222100913589665e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3462, - "real_time": 2.0194246667901438e+05, - "cpu_time": 2.8349148469091876e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6226403756909844e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0216878083547857e+05, - "cpu_time": 2.8364801461583248e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6208258881058714e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time_median", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0202921817805120e+05, - "cpu_time": 2.8356010774119297e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6219436126868096e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4782051468864202e+02, - "cpu_time": 2.4100657400825122e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9860389777141839e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2258100071856001e-03, - "cpu_time": 8.4966776282452048e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2253253062456373e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3402, - "real_time": 2.0561086562522926e+05, - "cpu_time": 2.9295617783658032e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1873801902791309e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3402, - "real_time": 2.0611660327204721e+05, - "cpu_time": 2.9277957554380584e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1795594803928030e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3402, - "real_time": 2.0543577094998446e+05, - "cpu_time": 2.9271712904174550e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1900968218409950e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3402, - "real_time": 2.0537900631977813e+05, - "cpu_time": 2.9258714726632705e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1909785315622514e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3402, - "real_time": 2.0602037353548707e+05, - "cpu_time": 2.9280260317463265e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1810446158962727e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0571252394050526e+05, - "cpu_time": 2.9276852657261828e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1858119279942912e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time_median", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0561086562522926e+05, - "cpu_time": 2.9277957554380584e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1873801902791309e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3771737943187111e+02, - "cpu_time": 1.3419803503618266e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2281430722580652e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6416957653465154e-03, - "cpu_time": 4.5837589377250285e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6410708448660921e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3322, - "real_time": 2.1062315380288914e+05, - "cpu_time": 3.0889122636964777e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2230575144963992e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3322, - "real_time": 2.1080111878496397e+05, - "cpu_time": 3.0907388199877995e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2178038122134054e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3322, - "real_time": 2.1067290398003344e+05, - "cpu_time": 3.0916515291992825e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2215879462326288e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3322, - "real_time": 2.1054566044316668e+05, - "cpu_time": 3.0875165382301231e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2253479707970870e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3322, - "real_time": 2.1084394076110038e+05, - "cpu_time": 3.0948730764599069e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2165409888877439e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1069735555443075e+05, - "cpu_time": 3.0907384455147182e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2208676465254533e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time_median", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1067290398003341e+05, - "cpu_time": 3.0907388199877995e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.2215879462326288e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2386405549733517e+02, - "cpu_time": 2.8126731766699777e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6570037604574597e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.8787664976334554e-04, - "cpu_time": 9.1003274015364537e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8786072429944870e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3071, - "real_time": 2.2663909028936573e+05, - "cpu_time": 3.4183447248452465e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1566583666802700e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3071, - "real_time": 2.2718808255771716e+05, - "cpu_time": 3.4231483490719897e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1538633411081424e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3071, - "real_time": 2.2690250962271041e+05, - "cpu_time": 3.4178416541843279e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1553155601314790e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3071, - "real_time": 2.2711326294024094e+05, - "cpu_time": 3.4230806512536644e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1542434669215090e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3071, - "real_time": 2.2671218655446378e+05, - "cpu_time": 3.4210450146533101e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1562854383084710e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2691102639289960e+05, - "cpu_time": 3.4206920788017078e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1552732346299741e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time_median", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2690250962271038e+05, - "cpu_time": 3.4210450146533101e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1553155601314790e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4042608048654407e+02, - "cpu_time": 2.5247820111128604e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2240465482652201e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0595610284281339e-03, - "cpu_time": 7.3809099239277598e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0595299116899161e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2738, - "real_time": 2.5568505285826148e+05, - "cpu_time": 4.1506925566105230e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0505226806927898e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2738, - "real_time": 2.5561048685689713e+05, - "cpu_time": 4.1487544046751037e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0511208536350908e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2738, - "real_time": 2.5560067432719620e+05, - "cpu_time": 4.1458881775017007e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0511995963236592e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2738, - "real_time": 2.5531058977364845e+05, - "cpu_time": 4.1453524068661174e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0535301746191559e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2738, - "real_time": 2.5573401069896156e+05, - "cpu_time": 4.1502154638422059e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0501301276550500e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5558816290299300e+05, - "cpu_time": 4.1481806018991309e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0513006865851490e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time_median", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5561048685689713e+05, - "cpu_time": 4.1487544046751043e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0511208536350908e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6459114480342313e+02, - "cpu_time": 2.4512102108981321e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3218053378012967e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.4397013904706043e-04, - "cpu_time": 5.9091212416737904e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4437424822478791e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2216, - "real_time": 3.1450123509660276e+05, - "cpu_time": 5.6197004648013774e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3340918348950763e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2216, - "real_time": 3.1459509016923263e+05, - "cpu_time": 5.6250794494584727e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3330971549363060e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2216, - "real_time": 3.1418425556031032e+05, - "cpu_time": 5.6165599232852587e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3374555899689794e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2216, - "real_time": 3.1441985801547777e+05, - "cpu_time": 5.6206390433209273e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3349547532343912e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2216, - "real_time": 3.1438137165380857e+05, - "cpu_time": 5.6189384476533672e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3353630162116413e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1441636209908646e+05, - "cpu_time": 5.6201834657038806e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3349924698492789e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time_median", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1441985801547777e+05, - "cpu_time": 5.6197004648013762e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3349547532343912e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5350663391717407e+02, - "cpu_time": 3.1261648774793173e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6285768192873187e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.8822724393966929e-04, - "cpu_time": 5.5623893713722245e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8832998395373296e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1659, - "real_time": 4.2161622013873683e+05, - "cpu_time": 8.5006882157930429e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9740780829302816e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1659, - "real_time": 4.2168758238015685e+05, - "cpu_time": 8.4995099276668392e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9732363190846586e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1659, - "real_time": 4.2115473548793007e+05, - "cpu_time": 8.4887914406270103e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9795284803585033e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1659, - "real_time": 4.2102800490196532e+05, - "cpu_time": 8.4943565461123467e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9810273321089735e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1659, - "real_time": 4.2131280774155754e+05, - "cpu_time": 8.4975822664254077e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9776602122346087e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2135987013006938e+05, - "cpu_time": 8.4961856793249305e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9771060853434057e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time_median", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2131280774155754e+05, - "cpu_time": 8.4975822664254101e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9776602122346087e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8615566799462533e+02, - "cpu_time": 4.7774054521776668e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3799082795602605e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.7912416031999461e-04, - "cpu_time": 5.6230002880036612e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7909106649613569e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1051, - "real_time": 6.6249836556352919e+05, - "cpu_time": 1.4683586945766730e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3310405248053312e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1051, - "real_time": 6.6276431204635929e+05, - "cpu_time": 1.4680051950523404e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3285000772742491e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1051, - "real_time": 6.6641743016206822e+05, - "cpu_time": 1.4725191417697468e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2938089704225969e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1051, - "real_time": 6.6251451317726017e+05, - "cpu_time": 1.4684211217887131e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3308862169450855e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1051, - "real_time": 6.6302271911406540e+05, - "cpu_time": 1.4698274529020635e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3260336019924812e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6344346801265655e+05, - "cpu_time": 1.4694263212179074e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3220538782879496e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time_median", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6276431204635941e+05, - "cpu_time": 1.4684211217887134e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3285000772742491e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6762241089656557e+03, - "cpu_time": 1.8638869139216390e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5921184976039942e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5265515296831265e-03, - "cpu_time": 1.2684453020936702e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5183564206433962e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 606, - "real_time": 1.1491197364623027e+06, - "cpu_time": 2.7291649521451010e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3000295215756140e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 606, - "real_time": 1.1461583869424174e+06, - "cpu_time": 2.7221352112211483e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3188907358415918e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 606, - "real_time": 1.1493882428310665e+06, - "cpu_time": 2.7291929554455085e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2983241757701988e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 606, - "real_time": 1.1461797843090945e+06, - "cpu_time": 2.7236573300330192e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3187541037085800e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 606, - "real_time": 1.1491918073438427e+06, - "cpu_time": 2.7298052904291539e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2995717045606251e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1480075915777448e+06, - "cpu_time": 2.7267911478547859e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3071140482913227e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time_median", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1491197364623027e+06, - "cpu_time": 2.7291649521451006e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3000295215756140e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6812100033599600e+03, - "cpu_time": 3.6051089458890083e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0706546903692152e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4644589597612482e-03, - "cpu_time": 1.3221067366032818e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4652223617880639e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 320, - "real_time": 2.1762460535683203e+06, - "cpu_time": 5.3855170000002068e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7092459156862993e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 320, - "real_time": 2.1760585470474325e+06, - "cpu_time": 5.3884768656249810e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7099102056624489e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 320, - "real_time": 2.1745750214904547e+06, - "cpu_time": 5.3844780062501486e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7151700144614410e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 320, - "real_time": 2.1768090133264195e+06, - "cpu_time": 5.3872137562500201e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7072521738425026e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 320, - "real_time": 2.1772840787889436e+06, - "cpu_time": 5.3891111249996014e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7055705148645010e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1761945428443146e+06, - "cpu_time": 5.3869593506249916e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7094297649034386e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time_median", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1762460535683203e+06, - "cpu_time": 5.3872137562500201e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7092459156862993e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0257509651522512e+03, - "cpu_time": 1.9516116532640785e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6349278715044679e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.7135076619187800e-04, - "cpu_time": 3.6228445886410003e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7149114556464160e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 158, - "real_time": 4.4294726486683274e+06, - "cpu_time": 1.1335942386076165e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.5752656493065329e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 158, - "real_time": 4.3424359328243174e+06, - "cpu_time": 1.1207815082278827e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.7270989184580135e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 158, - "real_time": 4.2896315166608822e+06, - "cpu_time": 1.1128633025317511e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.8222177988190718e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 158, - "real_time": 4.3302303168309638e+06, - "cpu_time": 1.1180108930379672e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.7488792846835175e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 158, - "real_time": 4.3212661336918799e+06, - "cpu_time": 1.1170415430379888e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.7649538264686155e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3426073097352739e+06, - "cpu_time": 1.1204582970886413e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.7276830955471497e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time_median", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3302303168309648e+06, - "cpu_time": 1.1180108930379672e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.7488792846835175e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2346649554014090e+04, - "cpu_time": 7.8740929982651855e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2204413020025030e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2054198277763490e-02, - "cpu_time": 7.0275645409784062e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1931702151859088e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 72, - "real_time": 9.3061325476608351e+06, - "cpu_time": 2.3534528472222544e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2112516833717690e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 72, - "real_time": 9.2731477149451766e+06, - "cpu_time": 2.3477120652775813e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2369022971394291e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 72, - "real_time": 9.3174770655524395e+06, - "cpu_time": 2.3548053819442634e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2024716055494862e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 72, - "real_time": 9.2949988967221640e+06, - "cpu_time": 2.3515656124999393e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2198893991978426e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 72, - "real_time": 9.3332237641637530e+06, - "cpu_time": 2.3554226791664708e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.1903198397186279e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3049959978088737e+06, - "cpu_time": 2.3525917172221020e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2121669649954319e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time_median", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3061325476608351e+06, - "cpu_time": 2.3534528472222544e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2112516833717690e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2738352746415592e+04, - "cpu_time": 3.1032279932986166e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7632408119269472e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4436714160618643e-03, - "cpu_time": 1.3190678053405936e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4448141875873281e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 40, - "real_time": 1.7224082397297025e+07, - "cpu_time": 4.3889106774997801e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7924457688998737e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 40, - "real_time": 1.7193830292671919e+07, - "cpu_time": 4.3856186549999163e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8061563779191275e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 40, - "real_time": 1.7137757735326886e+07, - "cpu_time": 4.3930902925001189e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8316971258924103e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 40, - "real_time": 1.7084873141720891e+07, - "cpu_time": 4.3912295250004262e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8559393966024370e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 40, - "real_time": 1.7168105812743306e+07, - "cpu_time": 4.3890790674998924e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8178530272323170e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7161729875952005e+07, - "cpu_time": 4.3895856435000271e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8208183393092337e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time_median", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7168105812743306e+07, - "cpu_time": 4.3890790674998924e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8178530272323170e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.3480247205149164e+04, - "cpu_time": 2.8033064008831465e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4395725045992792e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1162503775384980e-03, - "cpu_time": 6.3862665603397052e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1193315056781538e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 21, - "real_time": 3.3249820804312117e+07, - "cpu_time": 8.4815759571429655e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0732903067311277e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 21, - "real_time": 3.3231976308992930e+07, - "cpu_time": 8.4734486238089412e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0776254022352104e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 21, - "real_time": 3.3251184437956128e+07, - "cpu_time": 8.4821705571433380e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0729592204716091e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 21, - "real_time": 3.3269614336036500e+07, - "cpu_time": 8.4774137285713941e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0684871573410444e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 21, - "real_time": 3.3281874975987844e+07, - "cpu_time": 8.4873980238095701e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0655148243201561e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3256894172657110e+07, - "cpu_time": 8.4804013780952424e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0715753822198305e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time_median", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3251184437956125e+07, - "cpu_time": 8.4815759571429640e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0729592204716091e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9296221329189779e+04, - "cpu_time": 5.2614048375684884e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6831135871768044e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.8021717930156562e-04, - "cpu_time": 6.2041931778826205e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8019820981822549e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 6.5233018994331360e+07, - "cpu_time": 1.6467796249999082e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2300485287466640e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 6.5170713514089584e+07, - "cpu_time": 1.6459435579999989e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2379167428315973e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 6.5285514295101166e+07, - "cpu_time": 1.6478917919998822e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2234308452140846e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 6.5214185416698456e+07, - "cpu_time": 1.6470302660000017e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2324253315373192e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 6.5375610440969467e+07, - "cpu_time": 1.6476292080001259e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2120978814379797e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.5255808532238021e+07, - "cpu_time": 1.6470548897999835e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2271838659535294e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time_median", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.5233018994331360e+07, - "cpu_time": 1.6470302660000017e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2300485287466640e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8625597894911320e+04, - "cpu_time": 7.6512778333724607e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9063867521513607e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2048827478103852e-03, - "cpu_time": 4.6454297793934623e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2041042127606822e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.6245629638433456e+08, - "cpu_time": 3.2666085749997365e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.6094195663538437e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6236389428377151e+08, - "cpu_time": 3.2681441524999857e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.6131810199339495e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.6277373954653740e+08, - "cpu_time": 3.2728688174995565e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.5965298026037836e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.6231885924935341e+08, - "cpu_time": 3.2675770175001162e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.6150158334375877e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.6226390004158020e+08, - "cpu_time": 3.2649552750001478e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.6172563566193905e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6243533790111542e+08, - "cpu_time": 3.2680307674999082e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.6102805157897110e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time_median", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6236389428377151e+08, - "cpu_time": 3.2675770175001162e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.6131810199339495e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0187702822550543e+05, - "cpu_time": 2.9625478321922728e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.2055143021360943e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2428147152832019e-03, - "cpu_time": 9.0652384966946479e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2413261861634938e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3462, - "real_time": 2.0154591527857466e+05, - "cpu_time": 2.8193307741192129e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.0807281238353951e+06, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3462, - "real_time": 2.0166011516167957e+05, - "cpu_time": 2.8169753986134595e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.0778509135483494e+06, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3462, - "real_time": 2.0085465457763337e+05, - "cpu_time": 2.8085561640674330e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.0982139405896049e+06, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3462, - "real_time": 2.0108540811823308e+05, - "cpu_time": 2.8085003437322529e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.0923635363830784e+06, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3462, - "real_time": 2.0164186059947085e+05, - "cpu_time": 2.8086768861927901e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.0783106094920011e+06, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0135759074711829e+05, - "cpu_time": 2.8124079133450298e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.0854934247696856e+06, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time_median", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0154591527857466e+05, - "cpu_time": 2.8086768861927907e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.0807281238353951e+06, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.6565854070047021e+02, - "cpu_time": 5.3106863811467122e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2428196777662561e+03, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8159660102394393e-03, - "cpu_time": 1.8883058733931213e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8174872929237638e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3475, - "real_time": 2.0115673268572328e+05, - "cpu_time": 2.8144512287771440e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0181115852580922e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3475, - "real_time": 2.0125876042636769e+05, - "cpu_time": 2.8074851683452982e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0175954555524947e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3475, - "real_time": 2.0062884122799922e+05, - "cpu_time": 2.8041742877700645e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0207904244797017e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3475, - "real_time": 2.0074878957896432e+05, - "cpu_time": 2.8042168719425489e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0201804973745165e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3475, - "real_time": 2.0165961789362560e+05, - "cpu_time": 2.8140446014391183e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0155726869820358e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0109054836253606e+05, - "cpu_time": 2.8088744316548354e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0184501299293682e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time_median", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0115673268572328e+05, - "cpu_time": 2.8074851683452987e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0181115852580922e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1427295907122152e+02, - "cpu_time": 5.0878676597641515e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0973738804361841e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0601314305650487e-03, - "cpu_time": 1.8113546132308444e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0593780871544900e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3475, - "real_time": 2.0116552365474775e+05, - "cpu_time": 2.8127769525179366e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0361341872028720e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3475, - "real_time": 2.0161969737960494e+05, - "cpu_time": 2.8143425928058167e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0315475388737168e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3475, - "real_time": 2.0082337151134131e+05, - "cpu_time": 2.8091092661872489e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0396032439723689e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3475, - "real_time": 2.0103895047213885e+05, - "cpu_time": 2.8100195683456154e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0374161277605996e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3475, - "real_time": 2.0174834512512488e+05, - "cpu_time": 2.8103971510789561e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0302520932499591e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0127917762859157e+05, - "cpu_time": 2.8113291061871150e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0349906382119033e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time_median", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0116552365474781e+05, - "cpu_time": 2.8103971510789561e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0361341872028720e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.9193665609054420e+02, - "cpu_time": 2.1615087264621383e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.9615520049951701e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9472290214428512e-03, - "cpu_time": 7.6885652473242445e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9467175576179010e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3455, - "real_time": 2.0215653601845837e+05, - "cpu_time": 2.8407503096963337e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0523052884384654e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3455, - "real_time": 2.0280315818038653e+05, - "cpu_time": 2.8445468509403488e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0393848268938169e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3455, - "real_time": 2.0221567158193051e+05, - "cpu_time": 2.8378147641102289e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0511202400457360e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3455, - "real_time": 2.0204701241629411e+05, - "cpu_time": 2.8358167293776880e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0545019211278148e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3455, - "real_time": 2.0274254442030881e+05, - "cpu_time": 2.8374747293774423e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0405924782205723e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0239298452347566e+05, - "cpu_time": 2.8392806767004088e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0475809509452812e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time_median", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0221567158193045e+05, - "cpu_time": 2.8378147641102289e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.0511202400457360e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.5266096465649821e+02, - "cpu_time": 3.4388111600720680e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.0491304579004631e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7424564664967072e-03, - "cpu_time": 1.2111557650117167e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7415662696639070e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3433, - "real_time": 2.0356025387442941e+05, - "cpu_time": 2.8670693387705466e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0487225222792402e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3433, - "real_time": 2.0447426131459052e+05, - "cpu_time": 2.8712090853476070e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0127444376936346e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3433, - "real_time": 2.0360583240583271e+05, - "cpu_time": 2.8683531284591270e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0469207617505580e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3433, - "real_time": 2.0369765029429627e+05, - "cpu_time": 2.8682459044568456e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0432935658947900e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3433, - "real_time": 2.0426168889951441e+05, - "cpu_time": 2.8681759976699244e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0210831939512804e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0391993735773268e+05, - "cpu_time": 2.8686106909408100e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0345528963139012e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time_median", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0369765029429624e+05, - "cpu_time": 2.8682459044568450e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.0432935658947900e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1878241157064394e+02, - "cpu_time": 1.5423833715274910e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6486232508141451e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0536609465311001e-03, - "cpu_time": 5.3767608703349007e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0519166058020500e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3431, - "real_time": 2.0611079007846446e+05, - "cpu_time": 2.9134854065870371e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.5898245786902049e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3431, - "real_time": 2.0575016907891852e+05, - "cpu_time": 2.9144289099385723e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.5926110849236459e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3431, - "real_time": 2.0587285574604585e+05, - "cpu_time": 2.9166127892745344e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.5916619935763130e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3431, - "real_time": 2.0557090644852244e+05, - "cpu_time": 2.9110645671813894e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.5939998789763337e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3431, - "real_time": 2.0631723466435273e+05, - "cpu_time": 2.9122266715242696e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.5882337727775690e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0592439120326081e+05, - "cpu_time": 2.9135636689011607e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.5912662617888138e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time_median", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0587285574604585e+05, - "cpu_time": 2.9134854065870371e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.5916619935763130e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9454679143814212e+02, - "cpu_time": 2.1263215584017712e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2755359584062829e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4303637840910512e-03, - "cpu_time": 7.2980095856415770e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4300158389886624e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3379, - "real_time": 2.0956061148247591e+05, - "cpu_time": 3.0105614353354136e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1273052476982450e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3379, - "real_time": 2.0903822977099838e+05, - "cpu_time": 3.0087306333237042e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1351203113322747e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3379, - "real_time": 2.0897704840316784e+05, - "cpu_time": 3.0112349511691439e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1360381678644931e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3379, - "real_time": 2.0946325723594619e+05, - "cpu_time": 3.0084925599289301e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1287587553447682e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3379, - "real_time": 2.0916176549266206e+05, - "cpu_time": 3.0104566291805165e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1332686375846821e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0924018247705008e+05, - "cpu_time": 3.0098952417875419e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1320982239648926e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time_median", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0916176549266203e+05, - "cpu_time": 3.0104566291805159e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1332686375846821e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5913835845888548e+02, - "cpu_time": 1.2121901812054799e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8778444460808381e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2384732004681192e-03, - "cpu_time": 4.0273500697837386e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2380979678127439e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3262, - "real_time": 2.1455959840064554e+05, - "cpu_time": 3.1784355088902381e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1088854088573670e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3262, - "real_time": 2.1446056355268150e+05, - "cpu_time": 3.1838071857758187e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1117064055370069e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3262, - "real_time": 2.1431331456935659e+05, - "cpu_time": 3.1765048743105301e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1159055965970874e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3262, - "real_time": 2.1447287471832192e+05, - "cpu_time": 3.1828295278971811e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1113555815458465e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3262, - "real_time": 2.1446561509257829e+05, - "cpu_time": 3.1777934181481879e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1115624499256074e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1445439326671680e+05, - "cpu_time": 3.1798741030043917e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1118830884925830e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time_median", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1446561509257826e+05, - "cpu_time": 3.1784355088902381e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1115624499256074e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8708631017218593e+01, - "cpu_time": 3.2386023550593762e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5287815342571607e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1364800070517428e-04, - "cpu_time": 1.0184687349727138e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1374834852753243e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3017, - "real_time": 2.3091418605268787e+05, - "cpu_time": 3.4955654690095852e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1352442415131066e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3017, - "real_time": 2.3128245008354934e+05, - "cpu_time": 3.4952557739473355e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1334366265373878e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3017, - "real_time": 2.3100731296592602e+05, - "cpu_time": 3.4976118230026716e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1347865859063377e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3017, - "real_time": 2.3057911454012786e+05, - "cpu_time": 3.4927568180311256e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1368939486250775e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3017, - "real_time": 2.3110897903176895e+05, - "cpu_time": 3.4975522936691518e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1342873872674799e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3097840853481198e+05, - "cpu_time": 3.4957484355319745e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1349297579698780e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time_median", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3100731296592602e+05, - "cpu_time": 3.4955654690095858e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1347865859063377e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6167040600576809e+02, - "cpu_time": 1.9970030352590530e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2864218459587819e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1328782099835548e-03, - "cpu_time": 5.7126623156312844e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1334814660775901e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2701, - "real_time": 2.5918079901835578e+05, - "cpu_time": 4.2107576305072714e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0228658989621708e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2701, - "real_time": 2.5871566001604102e+05, - "cpu_time": 4.2075596556831623e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0265027635648062e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2701, - "real_time": 2.5897097813675122e+05, - "cpu_time": 4.2087789633472147e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0245048451844146e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2701, - "real_time": 2.5863219533773861e+05, - "cpu_time": 4.2023705331352225e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0271567478880613e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2701, - "real_time": 2.5920473004971285e+05, - "cpu_time": 4.2073140910774120e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0226791382219253e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5894087251171996e+05, - "cpu_time": 4.2073561747500568e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0247418787642758e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time_median", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5897097813675128e+05, - "cpu_time": 4.2075596556831629e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0245048451844146e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6177000567030160e+02, - "cpu_time": 3.1021777230510622e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0471133239955232e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0109257883127493e-03, - "cpu_time": 7.3732234548346757e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0110490356651787e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2200, - "real_time": 3.1774565425373358e+05, - "cpu_time": 5.6788733590906311e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3000482806372762e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2200, - "real_time": 3.1774652157433919e+05, - "cpu_time": 5.6803139272729331e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3000392728286014e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2200, - "real_time": 3.1761676630015823e+05, - "cpu_time": 5.6807508954555239e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3013874305648632e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2200, - "real_time": 3.1787633618064737e+05, - "cpu_time": 5.6824245090917265e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.2986916000066772e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2200, - "real_time": 3.1813168275138282e+05, - "cpu_time": 5.6859553727266844e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.2960439241113033e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1782339221205225e+05, - "cpu_time": 5.6816636127274984e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.2992421016297445e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time_median", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1774652157433925e+05, - "cpu_time": 5.6807508954555239e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3000392728286014e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9525155127631868e+02, - "cpu_time": 2.7128576337518098e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0260327133390517e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.1433977504728968e-04, - "cpu_time": 4.7747593287197351e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1409034285123891e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1645, - "real_time": 4.2546427391871449e+05, - "cpu_time": 8.5689001580553257e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9290907099773636e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1645, - "real_time": 4.2559680209415866e+05, - "cpu_time": 8.5652089361705806e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9275558220384092e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1645, - "real_time": 4.2507560362142022e+05, - "cpu_time": 8.5524496474158077e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9335976521196928e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1645, - "real_time": 4.2466825501650776e+05, - "cpu_time": 8.5493952401216724e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9383300381576185e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1645, - "real_time": 4.2476143877624924e+05, - "cpu_time": 8.5440055075978476e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9372466720189085e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2511327468541003e+05, - "cpu_time": 8.5559918978722463e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9331641788623991e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time_median", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2507560362142028e+05, - "cpu_time": 8.5524496474158077e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9335976521196928e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1238614752658816e+02, - "cpu_time": 1.0622075592379356e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7850696623560246e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.7006179783908129e-04, - "cpu_time": 1.2414779863245216e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6997981191444447e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1049, - "real_time": 6.6710906127668405e+05, - "cpu_time": 1.4755955996187201e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2872838092966766e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1049, - "real_time": 6.6647987641408341e+05, - "cpu_time": 1.4746705567207178e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2932192680249538e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1049, - "real_time": 6.6655002585661074e+05, - "cpu_time": 1.4757747836033779e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2925569534105539e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1049, - "real_time": 6.6734012133096496e+05, - "cpu_time": 1.4764087473785782e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2851068981657248e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1049, - "real_time": 6.6714454187014559e+05, - "cpu_time": 1.4754703355576342e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2869494341398478e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6692472534969798e+05, - "cpu_time": 1.4755840045758060e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2890232726075516e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time_median", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6710906127668405e+05, - "cpu_time": 1.4755955996187204e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.2872838092966766e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8507893447047451e+02, - "cpu_time": 6.2530780413882474e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6317284071141663e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.7739489905485309e-04, - "cpu_time": 4.2376970894217938e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7747097596736689e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 599, - "real_time": 1.1613613326111822e+06, - "cpu_time": 2.7354408848080467e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2230818819662399e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 599, - "real_time": 1.1687136093117236e+06, - "cpu_time": 2.7482385075126663e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.1776420956886120e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 599, - "real_time": 1.1642779591330055e+06, - "cpu_time": 2.7414842287147567e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2049873779683027e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 599, - "real_time": 1.1634172963830510e+06, - "cpu_time": 2.7396841736228638e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2103174209970493e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 599, - "real_time": 1.1653875298906921e+06, - "cpu_time": 2.7430373021701896e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.1981274767774572e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1646315454659308e+06, - "cpu_time": 2.7415770193657046e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2028312506795321e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time_median", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1642779591330055e+06, - "cpu_time": 2.7414842287147562e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2049873779683027e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7170054258956138e+03, - "cpu_time": 4.6837877999611546e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6788379288505487e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3329313347841946e-03, - "cpu_time": 1.7084283121999624e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3308028057608086e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 320, - "real_time": 2.1812122962728608e+06, - "cpu_time": 5.4010114312504241e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6916932976528749e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 320, - "real_time": 2.1810107711644378e+06, - "cpu_time": 5.4014122031254889e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6924040091020155e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 320, - "real_time": 2.1828463162819389e+06, - "cpu_time": 5.4068838031248841e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6859355030439234e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 320, - "real_time": 2.1846898074727505e+06, - "cpu_time": 5.4103573749998193e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6794499350037642e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 320, - "real_time": 2.1813938023115043e+06, - "cpu_time": 5.4053018312501423e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6910532991439228e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1822305987006989e+06, - "cpu_time": 5.4049933287501512e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6881072087893009e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time_median", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1813938023115043e+06, - "cpu_time": 5.4053018312501423e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6910532991439228e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5533804401185664e+03, - "cpu_time": 3.9090288995990859e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4696130990628581e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.1183148153245129e-04, - "cpu_time": 7.2322548092820826e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1143819285061655e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 160, - "real_time": 4.5907013904070482e+06, - "cpu_time": 1.1585451237499457e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.3092168595668116e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 160, - "real_time": 4.8797407274832949e+06, - "cpu_time": 1.2000801749999823e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 6.8762735304802866e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 160, - "real_time": 4.8517164890654385e+06, - "cpu_time": 1.1967856043750657e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 6.9159919124753761e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 160, - "real_time": 4.6211746172048151e+06, - "cpu_time": 1.1630366299999651e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.2610179834095707e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 160, - "real_time": 4.4571333215571940e+06, - "cpu_time": 1.1396599837500786e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.5282540546211548e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6800933091435581e+06, - "cpu_time": 1.1716215033750076e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.1781508681106405e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time_median", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6211746172048151e+06, - "cpu_time": 1.1630366299999651e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.2610179834095707e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8061498484060523e+05, - "cpu_time": 2.6025749083823897e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7680080342806870e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.8592176033699029e-02, - "cpu_time": 2.2213444366506890e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8561575051002710e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 72, - "real_time": 9.5757290384628698e+06, - "cpu_time": 2.3963306111110367e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0082250375343275e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 72, - "real_time": 9.5352375000301339e+06, - "cpu_time": 2.3905531083332535e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0379855771592388e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 72, - "real_time": 9.5767157359255683e+06, - "cpu_time": 2.3977439722222645e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0075029739320202e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 72, - "real_time": 9.5693778453601729e+06, - "cpu_time": 2.3964598111111477e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0128763943142376e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 72, - "real_time": 9.4255922206987944e+06, - "cpu_time": 2.3740036805558398e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.1198564958738146e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5365304680955075e+06, - "cpu_time": 2.3910182366667088e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0372892957627296e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time_median", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5693778453601729e+06, - "cpu_time": 2.3963306111110367e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.0128763943142376e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.4302605632322571e+04, - "cpu_time": 9.9093268874546513e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7816767910313636e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.7427672828653069e-03, - "cpu_time": 4.1443961971905034e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7947708131176187e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 40, - "real_time": 1.7484410572797060e+07, - "cpu_time": 4.4393115274999671e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6764228019685869e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 40, - "real_time": 1.7495974851772189e+07, - "cpu_time": 4.4321344449997470e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6713489323748608e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 40, - "real_time": 1.7500338843092322e+07, - "cpu_time": 4.4389263850001730e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6694359579773502e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 40, - "real_time": 1.7484646802768111e+07, - "cpu_time": 4.4370912899995573e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6763190880556479e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 40, - "real_time": 1.7422093916684389e+07, - "cpu_time": 4.4291965650000975e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7038804085119448e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7477492997422818e+07, - "cpu_time": 4.4353320424999088e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6794814377776794e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time_median", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7484646802768111e+07, - "cpu_time": 4.4370912899995573e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.6763190880556479e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1747438994957618e+04, - "cpu_time": 4.4642822645624765e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3979581450398292e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8164755665837774e-03, - "cpu_time": 1.0065271825841140e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8203809155170980e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 21, - "real_time": 3.3300620991559256e+07, - "cpu_time": 8.4887419238092273e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0609744805672131e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 21, - "real_time": 3.3372240939310618e+07, - "cpu_time": 8.4914671714289263e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0436748760194330e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 21, - "real_time": 3.3355456909963064e+07, - "cpu_time": 8.4928081190474540e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0477223479382181e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 21, - "real_time": 3.3308994557176318e+07, - "cpu_time": 8.4869175047612906e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0589480279634085e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 21, - "real_time": 3.3337551390840895e+07, - "cpu_time": 8.4914554857147902e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0520447603644199e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3334972957770027e+07, - "cpu_time": 8.4902780409523383e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0526728985705385e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time_median", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3337551390840895e+07, - "cpu_time": 8.4914554857147902e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0520447603644199e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0290584106728307e+04, - "cpu_time": 2.3903222576620879e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3171106243270645e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.0867282673669887e-04, - "cpu_time": 2.8153639328800712e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0865613399321776e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 6.5459381043910980e+07, - "cpu_time": 1.6513057130000561e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2015885796393366e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 6.5259122848510742e+07, - "cpu_time": 1.6496014879999167e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2267564834768810e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 6.5393204241991043e+07, - "cpu_time": 1.6523899280000478e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2098884467150517e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 6.5420245379209518e+07, - "cpu_time": 1.6525953020000088e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2064949296356049e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 6.5493605285882950e+07, - "cpu_time": 1.6536266680000153e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.1973027695838537e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.5405111759901047e+07, - "cpu_time": 1.6519038198000091e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2084062418101463e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time_median", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.5420245379209518e+07, - "cpu_time": 1.6523899280000478e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2064949296356049e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.0083068599616279e+04, - "cpu_time": 1.5281621473608242e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1317564091043619e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3773092985500399e-03, - "cpu_time": 9.2509147871928411e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3787772872883336e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.5851150080561638e+08, - "cpu_time": 3.2908959750000119e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.7739048494451904e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.5879665687680244e+08, - "cpu_time": 3.2917533074999028e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.7617407388685141e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.5887149795889854e+08, - "cpu_time": 3.2930925224997056e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.7585554224319487e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.5830601379275322e+08, - "cpu_time": 3.2831797024999785e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.7826976264192476e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.5864221379160881e+08, - "cpu_time": 3.2919135324999613e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.7683235019051046e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5862557664513588e+08, - "cpu_time": 3.2901670079999125e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.7690444278140020e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time_median", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5864221379160881e+08, - "cpu_time": 3.2917533074999028e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.7683235019051046e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2647088479744206e+05, - "cpu_time": 3.9836905017034104e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.6684586519920528e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/6/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4277072436060178e-03, - "cpu_time": 1.2107867144789985e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4283343469078675e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3541, - "real_time": 1.9680571802470315e+05, - "cpu_time": 2.7396188619032287e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.2031008564063516e+06, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3541, - "real_time": 1.9609901435880095e+05, - "cpu_time": 2.7376811493928405e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.2218518453458138e+06, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3541, - "real_time": 1.9717966879433821e+05, - "cpu_time": 2.7422384975998063e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.1932331880932897e+06, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3541, - "real_time": 1.9642006089063050e+05, - "cpu_time": 2.7356023467947112e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.2133167832087064e+06, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3541, - "real_time": 1.9654906276845318e+05, - "cpu_time": 2.7388537305846444e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.2098951049506385e+06, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9661070496738522e+05, - "cpu_time": 2.7387989172550465e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.2082795556009607e+06, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time_median", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9654906276845318e+05, - "cpu_time": 2.7388537305846449e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 5.2098951049506385e+06, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.0734571695380544e+02, - "cpu_time": 2.4481367598454335e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0786598294576223e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0718389521128971e-03, - "cpu_time": 8.9387239947468357e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0710482568041806e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3583, - "real_time": 1.9638930225274764e+05, - "cpu_time": 2.7336799441808643e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0428266593484202e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3583, - "real_time": 1.9645873659644913e+05, - "cpu_time": 2.7386425704718003e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0424580934808964e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3583, - "real_time": 1.9601535272772575e+05, - "cpu_time": 2.7350771281049686e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0448161184827013e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3583, - "real_time": 1.9633642248134824e+05, - "cpu_time": 2.7324710856827418e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0431075264165811e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3583, - "real_time": 1.9656662469089840e+05, - "cpu_time": 2.7359860396316566e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0418859270847665e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9635328774983383e+05, - "cpu_time": 2.7351713536144065e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0430188649626732e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time_median", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9638930225274764e+05, - "cpu_time": 2.7350771281049692e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 1.0428266593484202e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0761362581969215e+02, - "cpu_time": 2.3578426165463515e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1037364898663540e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0573473365223438e-03, - "cpu_time": 8.6204566797270957e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0582133525512539e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3585, - "real_time": 1.9644228287717924e+05, - "cpu_time": 2.7356866917711101e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0850908165025372e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3585, - "real_time": 1.9649284893570200e+05, - "cpu_time": 2.7426148898189270e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0845542329839833e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3585, - "real_time": 1.9662299231110423e+05, - "cpu_time": 2.7325797043238080e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0831744812016468e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3585, - "real_time": 1.9581432593434353e+05, - "cpu_time": 2.7334711827061354e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0917774940396279e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3585, - "real_time": 1.9651252637238006e+05, - "cpu_time": 2.7325424267782102e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0843454998071283e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9637699528614184e+05, - "cpu_time": 2.7353789790796384e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0857885049069852e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time_median", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9649284893570200e+05, - "cpu_time": 2.7334711827061360e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 2.0845542329839833e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2138938560530903e+02, - "cpu_time": 4.2418965819053130e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4202913166315237e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6365938644544954e-03, - "cpu_time": 1.5507527894114939e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6398073479573856e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3527, - "real_time": 1.9723905089950579e+05, - "cpu_time": 2.7547491834424267e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1533357429172896e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3527, - "real_time": 1.9747435987006390e+05, - "cpu_time": 2.7505857952933176e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1483866591036178e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3527, - "real_time": 1.9760210829938654e+05, - "cpu_time": 2.7535656620361563e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1457047551275700e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3527, - "real_time": 1.9743317244606777e+05, - "cpu_time": 2.7579514374818694e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1492520727426313e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3527, - "real_time": 1.9727462057457556e+05, - "cpu_time": 2.7573659824209614e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1525868741454177e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9740466241791990e+05, - "cpu_time": 2.7548436121349467e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1498532208073057e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time_median", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9743317244606774e+05, - "cpu_time": 2.7547491834424261e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 4.1492520727426313e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4915888230264406e+02, - "cpu_time": 2.9913211020464757e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1353935369025050e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.5559959159862157e-04, - "cpu_time": 1.0858406222661273e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5554323733227136e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3504, - "real_time": 1.9897943693483603e+05, - "cpu_time": 2.7920598344751575e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2340166664385587e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3504, - "real_time": 1.9858526845120947e+05, - "cpu_time": 2.7857927539955021e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2503602244923785e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3504, - "real_time": 1.9920416655967524e+05, - "cpu_time": 2.7870305964614335e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2247275661736086e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3504, - "real_time": 1.9880407984036533e+05, - "cpu_time": 2.7847792522828712e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2412795618459836e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3504, - "real_time": 1.9849308290713243e+05, - "cpu_time": 2.7859828681505041e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2541919144182295e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9881320693864374e+05, - "cpu_time": 2.7871290610730939e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2409151866737515e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time_median", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9880407984036530e+05, - "cpu_time": 2.7859828681505041e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 8.2412795618459836e+07, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8939613440841674e+02, - "cpu_time": 2.8698126154719603e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1992097889860639e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4556182602986135e-03, - "cpu_time": 1.0296662094173106e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4551900630227167e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3464, - "real_time": 2.0121101852790447e+05, - "cpu_time": 2.8335921275983128e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6285390452141491e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3464, - "real_time": 2.0085531333105167e+05, - "cpu_time": 2.8350090733251092e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6314231103257629e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3464, - "real_time": 2.0118722345793055e+05, - "cpu_time": 2.8327151876443520e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6287316578456578e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3464, - "real_time": 2.0122482501035291e+05, - "cpu_time": 2.8346505600464297e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6284273075309721e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3464, - "real_time": 2.0078325011698485e+05, - "cpu_time": 2.8358280571594747e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6320086451886785e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0105232608884491e+05, - "cpu_time": 2.8343590011547355e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6298259532210442e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time_median", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0118722345793052e+05, - "cpu_time": 2.8346505600464303e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 1.6287316578456578e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1468137648062174e+02, - "cpu_time": 1.2202401267946018e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7410398754767221e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0677885735365935e-03, - "cpu_time": 4.3051713854789326e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0682366862767674e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3400, - "real_time": 2.0508331866414449e+05, - "cpu_time": 2.9320012352941907e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1955792614866590e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3400, - "real_time": 2.0446274682934233e+05, - "cpu_time": 2.9300835264708061e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.2052782727555031e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3400, - "real_time": 2.0488401797004318e+05, - "cpu_time": 2.9290742941177142e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1986877575576562e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3400, - "real_time": 2.0489766933571766e+05, - "cpu_time": 2.9291755823531759e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1984746440732598e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3400, - "real_time": 2.0436152446028939e+05, - "cpu_time": 2.9287652647058968e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.2068658801150537e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0473785545190744e+05, - "cpu_time": 2.9298199805883574e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.2009771631976265e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time_median", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0488401797004318e+05, - "cpu_time": 2.9291755823531759e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 3.1986877575576562e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0966052365821622e+02, - "cpu_time": 1.3144439425936690e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8429808329168515e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5124732208155565e-03, - "cpu_time": 4.4864324473946240e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5129695046243129e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3270, - "real_time": 2.1380520528890847e+05, - "cpu_time": 3.0990514617739210e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1304400808617544e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3270, - "real_time": 2.1409954965956201e+05, - "cpu_time": 3.1021692568802909e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1220119429684246e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3270, - "real_time": 2.1347839817200397e+05, - "cpu_time": 3.0951006972477154e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1398249716298032e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3270, - "real_time": 2.1341172758890715e+05, - "cpu_time": 3.0930729785931687e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1417430747987139e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3270, - "real_time": 2.1402497497897749e+05, - "cpu_time": 3.1000580030578945e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1241450916125321e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1376397113767182e+05, - "cpu_time": 3.0978904795105988e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1316330323742473e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time_median", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1380520528890850e+05, - "cpu_time": 3.0990514617739210e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 6.1304400808617544e+08, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1147377141243049e+02, - "cpu_time": 3.7197168601221387e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9355830533882906e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4570919961616451e-03, - "cpu_time": 1.2007257469959930e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4572925362965367e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 3075, - "real_time": 2.2798358658196146e+05, - "cpu_time": 3.4344608162597968e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1498371612193129e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 3075, - "real_time": 2.2773045100975875e+05, - "cpu_time": 3.4274045626017783e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1511152717506654e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 3075, - "real_time": 2.2768612000788370e+05, - "cpu_time": 3.4298198991874832e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1513393964942753e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 3075, - "real_time": 2.2722646399075544e+05, - "cpu_time": 3.4261561268289277e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1536684389484894e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 3075, - "real_time": 2.2786100180176034e+05, - "cpu_time": 3.4311976585363812e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1504557512130399e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2769752467842394e+05, - "cpu_time": 3.4298078126828739e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1512832039251564e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time_median", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2773045100975875e+05, - "cpu_time": 3.4298198991874838e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 1.1511152717506654e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8795336592082424e+02, - "cpu_time": 3.2669818018640206e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4574311679389870e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2646310772482015e-03, - "cpu_time": 9.5252619980141465e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2659189007275164e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2736, - "real_time": 2.5569378064643408e+05, - "cpu_time": 4.1465689290935296e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0504526886595266e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2736, - "real_time": 2.5526278160634311e+05, - "cpu_time": 4.1429124707610556e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0539147802931089e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2736, - "real_time": 2.5555605946981133e+05, - "cpu_time": 4.1449080519000400e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0515576937902105e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2736, - "real_time": 2.5548681671289002e+05, - "cpu_time": 4.1434199451755668e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0521137127368195e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2736, - "real_time": 2.5573851989283651e+05, - "cpu_time": 4.1504535782164510e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0500939796620984e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5554759166566300e+05, - "cpu_time": 4.1456525950293284e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0516265710283527e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time_median", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5555605946981133e+05, - "cpu_time": 4.1449080519000400e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 2.0515576937902105e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8888281713419133e+02, - "cpu_time": 3.0387686043223698e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5169697480965136e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.3912970927665687e-04, - "cpu_time": 7.3300126690931079e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3939856771115570e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2248, - "real_time": 3.1114509171251958e+05, - "cpu_time": 5.6144970596080821e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3700547684320369e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2248, - "real_time": 3.1118744006442581e+05, - "cpu_time": 5.6119104092534538e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3695961500981884e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2248, - "real_time": 3.1091455801877315e+05, - "cpu_time": 5.6103261209970608e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3725535616015978e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2248, - "real_time": 3.1107028961194900e+05, - "cpu_time": 5.6148835186831187e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3708651549721050e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2248, - "real_time": 3.1097036193373939e+05, - "cpu_time": 5.6091161209964461e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3719483537901511e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1105754826828151e+05, - "cpu_time": 5.6121466459076328e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3710035977788162e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time_median", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1107028961194900e+05, - "cpu_time": 5.6119104092534550e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 3.3708651549721050e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1483220744200244e+02, - "cpu_time": 2.5282957245702073e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2445184082527666e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.6916708204412946e-04, - "cpu_time": 4.5050421596054264e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6918335212480661e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1664, - "real_time": 4.2094680342275894e+05, - "cpu_time": 8.4894627463942650e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9819881822307606e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1664, - "real_time": 4.2099496027521335e+05, - "cpu_time": 8.4919302163463878e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9814183016087580e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1664, - "real_time": 4.2045150903154886e+05, - "cpu_time": 8.4871095072112617e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9878569940930786e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1664, - "real_time": 4.2085901208548213e+05, - "cpu_time": 8.4879797415860789e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9830274267099218e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1664, - "real_time": 4.2106247668436065e+05, - "cpu_time": 8.4898754807688063e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9806195425295038e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2086295229987276e+05, - "cpu_time": 8.4892715384613606e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9829820894344053e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time_median", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2094680342275894e+05, - "cpu_time": 8.4894627463942650e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9819881822307606e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4164446235335805e+02, - "cpu_time": 1.8582917676915872e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8627636401770930e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.7416425236018825e-04, - "cpu_time": 2.1889884889091362e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7450811357462285e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1050, - "real_time": 6.6211849534218863e+05, - "cpu_time": 1.4687592523809404e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3346727655332251e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1050, - "real_time": 6.6208404788215249e+05, - "cpu_time": 1.4682678761902847e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3350023511615620e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1050, - "real_time": 6.6238835514966573e+05, - "cpu_time": 1.4700422457142503e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3320919931515141e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1050, - "real_time": 6.6203653357834334e+05, - "cpu_time": 1.4691540666667821e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3354570137233362e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1050, - "real_time": 6.6241397145425994e+05, - "cpu_time": 1.4698437009524025e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3318471239244070e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6220828068132210e+05, - "cpu_time": 1.4692134283809324e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3338142494988089e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time_median", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6211849534218875e+05, - "cpu_time": 1.4691540666667824e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 6.3346727655332251e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7869511091732025e+02, - "cpu_time": 7.3960298118862852e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7090245455463768e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6984729144955311e-04, - "cpu_time": 5.0340064071131461e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6982549191138832e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 609, - "real_time": 1.1506513233659009e+06, - "cpu_time": 2.7342342840724792e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.2903127382337942e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 609, - "real_time": 1.1456313943306876e+06, - "cpu_time": 2.7215915155994734e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3222574394453278e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 609, - "real_time": 1.1470035945366584e+06, - "cpu_time": 2.7267017110015391e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3134975687575302e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 609, - "real_time": 1.1464014629510725e+06, - "cpu_time": 2.7227033628899772e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3173388826685572e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 609, - "real_time": 1.1451621492101226e+06, - "cpu_time": 2.7234885467978218e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3252578298942699e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1469699848788886e+06, - "cpu_time": 2.7257438840722586e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3137328917998962e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time_median", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1464014629510727e+06, - "cpu_time": 2.7234885467978218e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 7.3173388826685572e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1758156118849920e+03, - "cpu_time": 5.1131644751414660e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3847872135469766e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8970118142322108e-03, - "cpu_time": 1.8758785464107518e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8934068744834664e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 321, - "real_time": 2.1731840175318290e+06, - "cpu_time": 5.3857950498443404e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7201083132640314e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 321, - "real_time": 2.1764119866527501e+06, - "cpu_time": 5.3895866978190299e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7086581506118269e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 321, - "real_time": 2.1745966387639907e+06, - "cpu_time": 5.3894281869160123e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7150933193458471e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 321, - "real_time": 2.1789979285377767e+06, - "cpu_time": 5.3935117975075105e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.6995098436180725e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 321, - "real_time": 2.1770180818099654e+06, - "cpu_time": 5.3914158380058184e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7065120130061016e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1760417306592627e+06, - "cpu_time": 5.3899475140185431e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7099763279691763e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time_median", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1764119866527501e+06, - "cpu_time": 5.3895866978190299e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 7.7086581506118269e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2407739661843825e+03, - "cpu_time": 2.8505674786647637e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.9392551782040615e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0297476995101138e-03, - "cpu_time": 5.2886739086991361e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0297379447720403e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 160, - "real_time": 4.2668307229178026e+06, - "cpu_time": 1.1107934756250869e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.8640176231445026e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 160, - "real_time": 4.3039920186856762e+06, - "cpu_time": 1.1155950993750708e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.7961185462994013e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 160, - "real_time": 4.2302293644752353e+06, - "cpu_time": 1.1054599956248978e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.9320597322179632e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 160, - "real_time": 4.3518763442989439e+06, - "cpu_time": 1.1214067487500755e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.7103367249754381e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 160, - "real_time": 4.3444013514090329e+06, - "cpu_time": 1.1212524475000408e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.7236031586071548e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2994659603573382e+06, - "cpu_time": 1.1149015533750344e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.8052271570488930e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time_median", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3039920186856762e+06, - "cpu_time": 1.1155950993750708e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 7.7961185462994013e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1588002117593431e+04, - "cpu_time": 6.8766224386716291e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.3931436481811777e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1998699976521232e-02, - "cpu_time": 6.1679189681408996e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2034427005366832e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 73, - "real_time": 9.3191201377609000e+06, - "cpu_time": 2.3560096246577416e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2012017237631845e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 73, - "real_time": 9.2185604041569848e+06, - "cpu_time": 2.3414394534247302e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2797553042813673e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 73, - "real_time": 9.2239982690917309e+06, - "cpu_time": 2.3424697821918964e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2754636375932541e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 73, - "real_time": 9.2659011253551263e+06, - "cpu_time": 2.3473463643833306e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2425620662370253e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 73, - "real_time": 9.2929588656311166e+06, - "cpu_time": 2.3537083383563150e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2214743409867020e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2641077603991721e+06, - "cpu_time": 2.3481947126028027e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2440914145723076e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time_median", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2659011253551263e+06, - "cpu_time": 2.3473463643833309e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 7.2425620662370253e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3431834659027772e+04, - "cpu_time": 6.5307152908992473e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3946744718707860e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6881832317067504e-03, - "cpu_time": 2.7811642943614437e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6861287048946057e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 40, - "real_time": 1.7224948294460773e+07, - "cpu_time": 4.4054514049997807e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7920540430975895e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 40, - "real_time": 1.7243680730462074e+07, - "cpu_time": 4.4096454124996856e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7835892520844307e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 40, - "real_time": 1.7132183676585555e+07, - "cpu_time": 4.3942289749998048e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.8342452155374975e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 40, - "real_time": 1.7269636550918221e+07, - "cpu_time": 4.4114464674998999e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7718907172290020e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 40, - "real_time": 1.7215032083913684e+07, - "cpu_time": 4.4064711149997041e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7965424255826769e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7217096267268062e+07, - "cpu_time": 4.4054486749997750e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7956643307062397e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time_median", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7224948294460773e+07, - "cpu_time": 4.4064711149997041e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 7.7920540430975895e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1824893462980872e+04, - "cpu_time": 6.7177596639861687e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3522766222309824e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0100832717946014e-03, - "cpu_time": 1.5248752532536342e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0174165054357598e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 21, - "real_time": 3.3282784656399772e+07, - "cpu_time": 8.4785526190476701e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0652943787978373e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 21, - "real_time": 3.3302700235730127e+07, - "cpu_time": 8.4791552761901453e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0604711960262718e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 21, - "real_time": 3.3324392601138070e+07, - "cpu_time": 8.4793772619042054e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0552242680886135e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 21, - "real_time": 3.3243919057505470e+07, - "cpu_time": 8.4792385761905581e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0747235467532940e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 21, - "real_time": 3.3270905770006634e+07, - "cpu_time": 8.4843887142856807e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0681739732493753e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3284940464156013e+07, - "cpu_time": 8.4801424895236522e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0647774725830784e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time_median", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.3282784656399775e+07, - "cpu_time": 8.4792385761905581e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 8.0652943787978373e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0644153392450669e+04, - "cpu_time": 2.3945425276261165e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4252194267482767e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.2066120489086743e-04, - "cpu_time": 2.8237055339392340e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2069737224504517e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 6.5195395052433014e+07, - "cpu_time": 1.6454250849999425e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2347980492828474e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 6.4974336326122284e+07, - "cpu_time": 1.6438772219999009e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2628148643998756e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 6.5133985131978989e+07, - "cpu_time": 1.6457565970001724e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2425620190773678e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 6.5289857983589172e+07, - "cpu_time": 1.6473592320000988e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2228837461240053e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 6.5253905951976776e+07, - "cpu_time": 1.6464169139999285e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2274141933374376e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.5169496089220047e+07, - "cpu_time": 1.6457670100000089e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2380945744443073e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time_median", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.5195395052433014e+07, - "cpu_time": 1.6457565970001724e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 8.2347980492828474e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2412808712834879e+05, - "cpu_time": 1.2889788522769666e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5711124354255490e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9046961320433060e-03, - "cpu_time": 7.8320858568975687e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9071308555977907e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5, - "real_time": 1.4631676971912384e+08, - "cpu_time": 3.2085087999998903e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.3384740933059311e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5, - "real_time": 1.4654195606708527e+08, - "cpu_time": 3.2106271120001113e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.3271972943260908e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5, - "real_time": 1.4648199677467346e+08, - "cpu_time": 3.2107026319999933e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.3301965268243017e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5, - "real_time": 1.4626535177230835e+08, - "cpu_time": 3.2115781339998645e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.3410538517112150e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5, - "real_time": 1.4647687077522278e+08, - "cpu_time": 3.2112276379998547e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.3304530491214476e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time_mean", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4641658902168277e+08, - "cpu_time": 3.2105288631999433e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.3334749630577974e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time_median", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4647687077522278e+08, - "cpu_time": 3.2107026319999933e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 7.3304530491214476e+09, - "hip_id": 7.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time_stddev", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1881241389712466e+05, - "cpu_time": 1.1947551193671697e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9523123479333641e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time_cv", - "family_index": 7, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_GPUToHost/0/7/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.1146825432144019e-04, - "cpu_time": 3.7213654518475619e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1166328076634790e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - } - ] -} diff --git a/results/prefetch_managed_HostToGPU.json b/results/prefetch_managed_HostToGPU.json deleted file mode 100644 index b1e2669..0000000 --- a/results/prefetch_managed_HostToGPU.json +++ /dev/null @@ -1,23444 +0,0 @@ -{ - "context": { - "date": "2023-10-09T16:29:18-04:00", - "host_name": "frontier10439", - "executable": "/lustre/orion/csc465/scratch/cpearson/frontier-gpu-bandwidth/build/comm_scope", - "num_cpus": 128, - "mhz_per_cpu": 1837, - "cpu_scaling_enabled": false, - "caches": [ - { - "type": "Data", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Instruction", - "level": 1, - "size": 32768, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 2, - "size": 524288, - "num_sharing": 2 - }, - { - "type": "Unified", - "level": 3, - "size": 33554432, - "num_sharing": 16 - } - ], - "load_avg": [2.11,2.17,4.33], - "library_build_type": "release" - }, - "benchmarks": [ - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9033, - "real_time": 7.7622128175128732e+04, - "cpu_time": 2.7965941226613527e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3192114466247069e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9033, - "real_time": 7.7436884263685599e+04, - "cpu_time": 2.7887871947304334e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3223672539730653e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9033, - "real_time": 7.7400070028531904e+04, - "cpu_time": 2.7894172689029103e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3229962190247685e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9033, - "real_time": 7.7558241222929573e+04, - "cpu_time": 2.7920338724676182e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3202981190053873e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9033, - "real_time": 7.7307865440764654e+04, - "cpu_time": 2.7880830942101195e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3245741480013002e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7465037826208092e+04, - "cpu_time": 2.7909831105944875e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3218894373258457e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time_median", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7436884263685599e+04, - "cpu_time": 2.7894172689029103e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3223672539730653e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2557950414638132e+02, - "cpu_time": 3.4738868230188717e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1427128879792785e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6211120225374117e-03, - "cpu_time": 1.2446821372125480e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6209471287658831e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9301, - "real_time": 7.7195294497975920e+04, - "cpu_time": 2.7875992635200504e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6530114475483984e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9301, - "real_time": 7.7382355819046192e+04, - "cpu_time": 2.7877881238576508e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6465981531876855e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9301, - "real_time": 7.7345920500265973e+04, - "cpu_time": 2.7866944285560661e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6478448853588309e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9301, - "real_time": 7.7405324886844028e+04, - "cpu_time": 2.7871900688098074e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6458128080902644e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9301, - "real_time": 7.6994885602807641e+04, - "cpu_time": 2.7849192312654556e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6599169333986502e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7264756261387942e+04, - "cpu_time": 2.7868382232018060e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6506368455167662e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time_median", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7345920500265973e+04, - "cpu_time": 2.7871900688098074e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6478448853588309e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7163328424413587e+02, - "cpu_time": 1.1520086694981407e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8978000185980367e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2213657629812180e-03, - "cpu_time": 4.1337479151358654e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2250501907017015e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9061, - "real_time": 7.7477862720084086e+04, - "cpu_time": 2.7899607493654115e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2866713874106653e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9061, - "real_time": 7.7454629817347697e+04, - "cpu_time": 2.7908812040613568e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2882571508754529e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9061, - "real_time": 7.7450707062008179e+04, - "cpu_time": 2.7873792583600042e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2885249927036583e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9061, - "real_time": 7.7566102187136581e+04, - "cpu_time": 2.7905493521686381e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2806572516921870e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9061, - "real_time": 7.7625824017308114e+04, - "cpu_time": 2.7926438141485455e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2765945506571643e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7515025160776946e+04, - "cpu_time": 2.7902828756207915e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2841410666678265e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time_median", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7477862720084086e+04, - "cpu_time": 2.7905493521686381e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2866713874106653e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7541459171466514e+01, - "cpu_time": 1.9064230854563536e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2832364701951396e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0003410178947209e-03, - "cpu_time": 6.8323649265567964e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.9982880917423014e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8950, - "real_time": 7.7925954951726511e+04, - "cpu_time": 2.8070843877094961e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0512543612811381e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8950, - "real_time": 7.7644784487855446e+04, - "cpu_time": 2.8051572581005574e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0550612064975625e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8950, - "real_time": 7.7769835398261886e+04, - "cpu_time": 2.8044154391061427e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0533647085722244e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8950, - "real_time": 7.7674976165026586e+04, - "cpu_time": 2.8042990290502791e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0546511121671222e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8950, - "real_time": 7.7907380543248568e+04, - "cpu_time": 2.8056875642458157e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0515049977135852e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7784586309223814e+04, - "cpu_time": 2.8053287356424582e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0531672772463265e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time_median", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7769835398261886e+04, - "cpu_time": 2.8051572581005574e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0533647085722244e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2926720324041651e+02, - "cpu_time": 1.1330140032552897e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7500095674024185e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6618614223456738e-03, - "cpu_time": 4.0387922772117265e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6616634462647728e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8826, - "real_time": 7.9748117373028523e+04, - "cpu_time": 2.8367841162474547e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0544685617294842e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8826, - "real_time": 7.9658727413601839e+04, - "cpu_time": 2.8369197337412217e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0567740073139063e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8826, - "real_time": 7.9485271903024346e+04, - "cpu_time": 2.8288674461817415e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0612623707180905e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8826, - "real_time": 7.9229827018406868e+04, - "cpu_time": 2.8284198855653702e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0679080867100251e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8826, - "real_time": 7.9537469873559312e+04, - "cpu_time": 2.8320961975980096e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0599096282601944e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9531882716324195e+04, - "cpu_time": 2.8326174758667604e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0600645309463403e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time_median", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9537469873559341e+04, - "cpu_time": 2.8320961975980102e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0599096282601944e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9766665935008120e+02, - "cpu_time": 4.1177825613286751e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1264656252626918e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4853763371240982e-03, - "cpu_time": 1.4537023076399203e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4884975923097547e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8566, - "real_time": 8.2053540718342745e+04, - "cpu_time": 2.8806988337613840e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9934900691829425e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8566, - "real_time": 8.1889746469591642e+04, - "cpu_time": 2.8799961218771833e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.0014777689130878e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8566, - "real_time": 8.1521729606258043e+04, - "cpu_time": 2.8705518841933366e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.0195418029360056e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8566, - "real_time": 8.1553944989880620e+04, - "cpu_time": 2.8695835127247160e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.0179540062796372e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8566, - "real_time": 8.2152258628065669e+04, - "cpu_time": 2.8767395773990185e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9886913089453965e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.1834244082427758e+04, - "cpu_time": 2.8755139859911276e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.0042309912514138e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time_median", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.1889746469591657e+04, - "cpu_time": 2.8767395773990185e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.0014777689130878e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8659102385985091e+02, - "cpu_time": 5.2025770105251468e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4028288047655709e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.5020916619108913e-03, - "cpu_time": 1.8092685467262404e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5033663338366870e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8020, - "real_time": 8.7139039878866126e+04, - "cpu_time": 2.9624378179551085e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.5208540386838114e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8020, - "real_time": 8.7058481544874870e+04, - "cpu_time": 2.9634466720698238e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.5278133545459366e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8020, - "real_time": 8.7131180006601644e+04, - "cpu_time": 2.9623326820448897e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.5215324749457717e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8020, - "real_time": 8.7097663537380256e+04, - "cpu_time": 2.9607293615960213e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.5244268718957663e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8020, - "real_time": 8.7138580650722884e+04, - "cpu_time": 2.9581844364089699e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.5208936742598093e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7112989123689156e+04, - "cpu_time": 2.9614261940149625e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.5231040828662193e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time_median", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7131180006601644e+04, - "cpu_time": 2.9623326820448897e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.5215324749457717e+08, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4894218977096223e+01, - "cpu_time": 2.0568181074801777e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0143642381105840e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.0056275565921573e-04, - "cpu_time": 6.9453633915881610e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0068091640201590e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7191, - "real_time": 9.4524010053624123e+04, - "cpu_time": 3.1246118217215902e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3866529776470757e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7191, - "real_time": 9.4389951583834350e+04, - "cpu_time": 3.1213037240995682e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3886223883014255e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7191, - "real_time": 9.6790214781456438e+04, - "cpu_time": 3.1172400917813869e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3541864773825405e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7191, - "real_time": 9.4456254043549328e+04, - "cpu_time": 3.1189074718397990e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3876476611021316e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7191, - "real_time": 9.4252980360317699e+04, - "cpu_time": 3.1179628605200851e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3906403754971743e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.4882682164556405e+04, - "cpu_time": 3.1200051939924865e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3815499759860697e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time_median", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.4456254043549328e+04, - "cpu_time": 3.1189074718397990e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3876476611021316e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0710363086187599e+03, - "cpu_time": 2.9970447795394568e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5367480476476291e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1288006242922668e-02, - "cpu_time": 9.6058967636022312e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1123361980088980e-02, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6112, - "real_time": 1.1474508862564449e+05, - "cpu_time": 3.4596641966623027e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2845770842118044e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6112, - "real_time": 1.1461435848338209e+05, - "cpu_time": 3.4553172005890211e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2871828928659768e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6112, - "real_time": 1.1517446763366539e+05, - "cpu_time": 3.4614308147905738e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2760600103991761e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6112, - "real_time": 1.1482692212328651e+05, - "cpu_time": 3.4580333949607343e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2829489387388024e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6112, - "real_time": 1.1473427873232197e+05, - "cpu_time": 3.4583089692408493e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2847923296889215e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1481902311966009e+05, - "cpu_time": 3.4585509152486961e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2831122511809363e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time_median", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1474508862564449e+05, - "cpu_time": 3.4583089692408487e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2845770842118044e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1268446742406960e+02, - "cpu_time": 2.2536910008626359e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2219454735275777e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8523452094033042e-03, - "cpu_time": 6.5162868961279354e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8492062627861519e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4419, - "real_time": 1.5870898509992743e+05, - "cpu_time": 4.1804784679791855e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3034550606564217e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4419, - "real_time": 1.5855842671720329e+05, - "cpu_time": 4.1796369155917771e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3065918403384089e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4419, - "real_time": 1.5850332219376092e+05, - "cpu_time": 4.1755643267707585e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3077413945878620e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4419, - "real_time": 1.5872892396030121e+05, - "cpu_time": 4.1786641977822955e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3030400945143857e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4419, - "real_time": 1.5896887240375424e+05, - "cpu_time": 4.1875464426340733e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2980544686031146e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5869370607498946e+05, - "cpu_time": 4.1803780701516184e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3037765717400389e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time_median", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5870898509992746e+05, - "cpu_time": 4.1796369155917771e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3034550606564217e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8147781089069761e+02, - "cpu_time": 4.4174211280471008e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7760359466085597e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1435728320878819e-03, - "cpu_time": 1.0567037368194032e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1429453126183379e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2801, - "real_time": 2.4744380099413119e+05, - "cpu_time": 5.6404454551945871e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2376329323556981e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2801, - "real_time": 2.5035907400804228e+05, - "cpu_time": 5.6490175758658000e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1882883780210686e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2801, - "real_time": 2.4752509000835661e+05, - "cpu_time": 5.6449455515887914e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2362412633183947e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2801, - "real_time": 2.5014097339381231e+05, - "cpu_time": 5.6418074973224127e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1919401918579822e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2801, - "real_time": 2.4764967856585240e+05, - "cpu_time": 5.6446983577294613e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2341100786899419e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4862372339403900e+05, - "cpu_time": 5.6441828875402105e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2176425688486171e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time_median", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4764967856585240e+05, - "cpu_time": 5.6446983577294624e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2341100786899419e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4884106312292374e+03, - "cpu_time": 3.3103042298076798e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5194174185810495e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.9865993916850971e-03, - "cpu_time": 5.8649839946103204e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9735204618556158e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1636, - "real_time": 4.2767761120971746e+05, - "cpu_time": 8.5474152689486207e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9035814478762455e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1636, - "real_time": 4.2763192383521225e+05, - "cpu_time": 8.5416843459658534e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9041053371126156e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1636, - "real_time": 4.2781677805963211e+05, - "cpu_time": 8.5471158618581621e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9019863351588430e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1636, - "real_time": 4.2804718465307466e+05, - "cpu_time": 8.5448043337408616e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8993477242461195e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1636, - "real_time": 4.2775496344502177e+05, - "cpu_time": 8.5420986430317280e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9026947182800875e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2778569224053173e+05, - "cpu_time": 8.5446236907090456e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9023431125347824e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time_median", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2775496344502189e+05, - "cpu_time": 8.5448043337408616e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9026947182800875e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6249238474118579e+02, - "cpu_time": 2.6949986678597696e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8615972703031127e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.7984530031878895e-04, - "cpu_time": 3.1540285042513494e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7973622563120923e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 862, - "real_time": 8.0810976120170089e+05, - "cpu_time": 1.4774104466357152e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1902652354586754e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 862, - "real_time": 8.0760229337612586e+05, - "cpu_time": 1.4771326264501070e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1935266088287106e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 862, - "real_time": 8.0779497822305828e+05, - "cpu_time": 1.4774436856148303e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1922877872135239e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 862, - "real_time": 8.0807581215744652e+05, - "cpu_time": 1.4774725046403713e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1904832899301977e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 862, - "real_time": 8.0792582742416079e+05, - "cpu_time": 1.4775482691415397e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1914468601311245e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0790173447649856e+05, - "cpu_time": 1.4774015064965128e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1916019563124466e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time_median", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0792582742416079e+05, - "cpu_time": 1.4774436856148303e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1914468601311245e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0929673719675043e+02, - "cpu_time": 1.5869427561490158e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3450783692855968e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5906212137589957e-04, - "cpu_time": 1.0741445363165141e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5908734540985401e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 441, - "real_time": 1.5720614119139321e+06, - "cpu_time": 2.7389811995465439e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3360561721231689e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 441, - "real_time": 1.5800190115951491e+06, - "cpu_time": 2.7384551065759715e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3091816860678549e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 441, - "real_time": 1.5723204452443083e+06, - "cpu_time": 2.7334466258503790e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3351770788025160e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 441, - "real_time": 1.5804724878147920e+06, - "cpu_time": 2.7327479251700821e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3076583519643154e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 441, - "real_time": 1.5725954414647317e+06, - "cpu_time": 2.7339006507936586e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3342441284115410e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5754937596065828e+06, - "cpu_time": 2.7355063015873274e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3244634834738798e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time_median", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5725954414647317e+06, - "cpu_time": 2.7339006507936586e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3342441284115410e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3450207969251524e+03, - "cpu_time": 2.9664535116946076e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4669512154440584e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7578787731981557e-03, - "cpu_time": 1.0844257642445454e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7551155529513829e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 220, - "real_time": 3.1852891848591920e+06, - "cpu_time": 5.3633389409091072e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2670935121834631e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 220, - "real_time": 3.1872164659117432e+06, - "cpu_time": 5.3664091090908526e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2639085482387114e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 220, - "real_time": 3.1888375344516877e+06, - "cpu_time": 5.3676288136363775e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2612326023955927e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 220, - "real_time": 3.1878797263330356e+06, - "cpu_time": 5.3663101590909818e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2628133556652555e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 220, - "real_time": 3.1877968439155002e+06, - "cpu_time": 5.3673866727273576e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2629501883165541e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1874039510942320e+06, - "cpu_time": 5.3662147390909353e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2635996413599167e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time_median", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1877968439155007e+06, - "cpu_time": 5.3664091090908526e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2629501883165541e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3175047444720735e+03, - "cpu_time": 1.7095419804529120e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1763194071459272e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.1334727718454875e-04, - "cpu_time": 3.1857502235225815e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1346598438927773e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 100, - "real_time": 6.6909265285357833e+06, - "cpu_time": 1.0885648220000234e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.0149156259443970e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 100, - "real_time": 6.7031313618645072e+06, - "cpu_time": 1.0899702510000112e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.0057846383405323e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 100, - "real_time": 6.6902225138619542e+06, - "cpu_time": 1.0892897329999870e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.0154433474336843e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 100, - "real_time": 6.7804312193766236e+06, - "cpu_time": 1.1132999339999968e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9487165217620058e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 100, - "real_time": 6.7067730193957686e+06, - "cpu_time": 1.0915768220000073e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.0030665870101280e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7142969286069274e+06, - "cpu_time": 1.0945403124000054e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9975853440981493e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time_median", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7031313618645072e+06, - "cpu_time": 1.0899702510000112e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 5.0057846383405323e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7685463214902433e+04, - "cpu_time": 1.0545925856459734e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7859833086673006e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.6127191894567215e-03, - "cpu_time": 9.6350273598745928e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.5746587938860937e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.4025020632235443e+07, - "cpu_time": 2.2827394745098002e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7849387006073551e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.4010997014302833e+07, - "cpu_time": 2.2794314647059057e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7897279495166063e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3996195212444838e+07, - "cpu_time": 2.2801981784313589e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7947933692957907e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.3964530774483494e+07, - "cpu_time": 2.2709169705882348e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.8056655167120829e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.4014482425124038e+07, - "cpu_time": 2.2827237980392039e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7885367410852518e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4002245211718127e+07, - "cpu_time": 2.2792019772549007e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7927324554434175e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time_median", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4010997014302835e+07, - "cpu_time": 2.2801981784313589e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7897279495166063e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3473626090760365e+04, - "cpu_time": 4.8632171762732876e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0449538371926034e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6764187268421692e-03, - "cpu_time": 2.1337368187661046e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6785735302323056e-03, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 27, - "real_time": 2.6435841081870928e+07, - "cpu_time": 4.2795387962963067e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0771120761519232e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 27, - "real_time": 2.6404617354273796e+07, - "cpu_time": 4.2740501703704059e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0831158126317558e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 27, - "real_time": 2.6409630767173238e+07, - "cpu_time": 4.2769515333333172e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0821508707660751e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 27, - "real_time": 2.6428807181892570e+07, - "cpu_time": 4.2785779518518895e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0784633251234245e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 27, - "real_time": 2.6422140223008614e+07, - "cpu_time": 4.2772966222223110e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0797447469119902e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6420207321643829e+07, - "cpu_time": 4.2772830148148462e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0801173663170347e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time_median", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6422140223008610e+07, - "cpu_time": 4.2772966222223110e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0797447469119902e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3009791982424274e+04, - "cpu_time": 2.0812712676840558e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5016138335402608e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.9241823972238311e-04, - "cpu_time": 4.8658722382300654e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.9243229105824218e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.0380702689290047e+07, - "cpu_time": 8.0095505099998832e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3281403726245394e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.0419471785426140e+07, - "cpu_time": 8.0073222300001130e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3240434001847649e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.0439391285181046e+07, - "cpu_time": 8.0002854300002471e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3219408315672045e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.0455615669488907e+07, - "cpu_time": 8.0122515700000465e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3202295212963982e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.0412702560424805e+07, - "cpu_time": 8.0015644299999163e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3247582923818159e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0421576797962189e+07, - "cpu_time": 8.0061948340000421e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3238224836109447e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time_median", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0419471785426140e+07, - "cpu_time": 8.0073222300001130e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.3240434001847649e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8416001908235583e+04, - "cpu_time": 5.1375415080759994e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0007790783594851e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.6356829184651827e-04, - "cpu_time": 6.4169578864834960e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6365122759017530e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 9.9116587804423437e+07, - "cpu_time": 1.5694365122222269e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4165596686939240e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 9.9276623792118490e+07, - "cpu_time": 1.5710115988888952e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4078280615604677e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 9.9274385306570262e+07, - "cpu_time": 1.5719449599999774e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4079499998119688e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 9.9264661471048996e+07, - "cpu_time": 1.5721402488888872e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4084797554725046e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 9.9306651287608683e+07, - "cpu_time": 1.5716372833333340e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4061928887837734e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.9247781932353988e+07, - "cpu_time": 1.5712341206666642e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4094020748645287e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time_median", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.9274385306570262e+07, - "cpu_time": 1.5716372833333343e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4079499998119688e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5003352269169103e+04, - "cpu_time": 1.0919950902214705e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0916603473504493e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.5571817131682027e-04, - "cpu_time": 6.9499196577919539e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5639789587149885e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.7572510987520218e+08, - "cpu_time": 2.8233627925000346e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1103494245219612e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.7582659423351288e+08, - "cpu_time": 2.8211971549999505e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1068226264678612e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.7586971446871758e+08, - "cpu_time": 2.8231693549999905e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1053253383827457e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.7594934999942780e+08, - "cpu_time": 2.8251226924999881e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1025620384701157e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.7602631449699402e+08, - "cpu_time": 2.8252795099999875e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.0998937975170536e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time_mean", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7587941661477092e+08, - "cpu_time": 2.8236263009999907e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1049906450719471e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time_median", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7586971446871758e+08, - "cpu_time": 2.8233627925000346e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.1053253383827457e+09, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time_stddev", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1528721907682721e+05, - "cpu_time": 1.6696761803393063e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0018957299759821e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time_cv", - "family_index": 0, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/0/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.5549011530633555e-04, - "cpu_time": 5.9132335597950362e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.5551218054795562e-04, - "hip_id": NaN, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9324, - "real_time": 7.5152164992015300e+04, - "cpu_time": 2.7379194583869632e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3625688629313568e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9324, - "real_time": 7.5292586983273286e+04, - "cpu_time": 2.7420790744315792e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3600276481766896e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9324, - "real_time": 7.5097374841526151e+04, - "cpu_time": 2.7395141419991601e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3635629769494481e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9324, - "real_time": 7.4959766057453089e+04, - "cpu_time": 2.7378741151866247e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3660661630335838e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9324, - "real_time": 7.5115221369512554e+04, - "cpu_time": 2.7387774517374422e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3632390097909195e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5123422848756076e+04, - "cpu_time": 2.7392328483483533e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3630929321763996e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time_median", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5115221369512539e+04, - "cpu_time": 2.7387774517374422e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3632390097909195e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1934396033804019e+02, - "cpu_time": 1.7290650726512894e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1652365380311225e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5886384806814795e-03, - "cpu_time": 6.3122237808072620e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5884731605012214e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9066, - "real_time": 7.5136350816257342e+04, - "cpu_time": 2.7398657180675032e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7257112938693207e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9066, - "real_time": 7.5027600659598145e+04, - "cpu_time": 2.7370817229208030e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7296621269975305e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9066, - "real_time": 7.5161817887789584e+04, - "cpu_time": 2.7390526516655734e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7247877413735464e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9066, - "real_time": 7.5155571221360427e+04, - "cpu_time": 2.7414776472534629e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7250142161356173e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9066, - "real_time": 7.4894356776528948e+04, - "cpu_time": 2.7387086190160981e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7345184445750128e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5075139472306910e+04, - "cpu_time": 2.7392372717846878e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7279387645902056e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time_median", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5136350816257342e+04, - "cpu_time": 2.7390526516655728e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7257112938693207e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1475143179772707e+02, - "cpu_time": 1.6104484014496822e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.1744976786135601e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5284877604530541e-03, - "cpu_time": 5.8791854872813952e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5302754346249625e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9320, - "real_time": 7.5055235975639051e+04, - "cpu_time": 2.7404586437768210e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4573141323937126e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9320, - "real_time": 7.5227442818955882e+04, - "cpu_time": 2.7424614710300998e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4448215259124644e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9320, - "real_time": 7.4968970093245080e+04, - "cpu_time": 2.7407171255364758e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4635937974144071e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9320, - "real_time": 7.4838514929811427e+04, - "cpu_time": 2.7395978766094596e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4731176905922070e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9320, - "real_time": 7.5037107614970460e+04, - "cpu_time": 2.7404948980686505e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4586325755216308e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5025454286524386e+04, - "cpu_time": 2.7407460030043015e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4594959443668842e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time_median", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5037107614970460e+04, - "cpu_time": 2.7404948980686505e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4586325755216308e+07, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4138502703566732e+02, - "cpu_time": 1.0497008736444836e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0285774595284498e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8844941144336668e-03, - "cpu_time": 3.8299823204844281e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8840154292810447e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9010, - "real_time": 7.5905982766047964e+04, - "cpu_time": 2.7638487014428136e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0792298184517024e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9010, - "real_time": 7.5814047302671141e+04, - "cpu_time": 2.7635072674806265e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0805385402121082e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9010, - "real_time": 7.5837705329999371e+04, - "cpu_time": 2.7616268867924850e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0802014597294867e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9010, - "real_time": 7.5798828179706936e+04, - "cpu_time": 2.7618348690344236e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0807554940794170e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9010, - "real_time": 7.5805755934700501e+04, - "cpu_time": 2.7628844350721227e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0806567257315704e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5832463902625197e+04, - "cpu_time": 2.7627404319644946e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0802764076408571e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time_median", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5814047302671155e+04, - "cpu_time": 2.7628844350721233e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0805385402121082e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3635835033303657e+01, - "cpu_time": 9.8704887218108723e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2125785105703093e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.7542420208494724e-04, - "cpu_time": 3.5727166430877074e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7509156606849732e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9265, - "real_time": 7.7490174436382091e+04, - "cpu_time": 2.7937923961144482e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1143325743124944e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9265, - "real_time": 7.7426883800117837e+04, - "cpu_time": 2.7894457323260029e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1160608816824245e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9265, - "real_time": 7.7667860305140319e+04, - "cpu_time": 2.7924453696708527e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1094954767172402e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9265, - "real_time": 7.7377732675605497e+04, - "cpu_time": 2.7889191991365561e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1174050251236302e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9265, - "real_time": 7.7498276538343242e+04, - "cpu_time": 2.7926115434430278e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1141115301956183e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7492185551117800e+04, - "cpu_time": 2.7914428481381777e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1142810976062813e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time_median", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7490174436382105e+04, - "cpu_time": 2.7924453696708521e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1143325743124944e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0984823998316847e+02, - "cpu_time": 2.1359160604890303e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9941661922812503e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4175395777256399e-03, - "cpu_time": 7.6516560670895786e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4161627778213339e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8787, - "real_time": 7.9439838367629418e+04, - "cpu_time": 2.8283462831456109e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1248825115123200e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8787, - "real_time": 7.9484920661395241e+04, - "cpu_time": 2.8305167554341676e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1225429587570786e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8787, - "real_time": 7.9418495194291711e+04, - "cpu_time": 2.8299043302606524e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1259910452641308e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8787, - "real_time": 7.9441346464894814e+04, - "cpu_time": 2.8295980539433140e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1248042056387103e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8787, - "real_time": 7.9468860589282849e+04, - "cpu_time": 2.8301037248207675e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1233760943615544e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9450692255498812e+04, - "cpu_time": 2.8296938295209024e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1243193631067586e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time_median", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9441346464894799e+04, - "cpu_time": 2.8299043302606524e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1248042056387103e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6189089133495280e+01, - "cpu_time": 8.2380003173886934e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3594206486588321e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.2962694710419880e-04, - "cpu_time": 2.9112691385355550e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2961090763708716e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8246, - "real_time": 8.4696899785613845e+04, - "cpu_time": 2.9201278098472086e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7377094280765617e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8246, - "real_time": 8.4725037966082062e+04, - "cpu_time": 2.9185642893524340e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7351396438719797e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8246, - "real_time": 8.4599807737781142e+04, - "cpu_time": 2.9177455032743211e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7465897089423871e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8246, - "real_time": 8.4760043176111052e+04, - "cpu_time": 2.9190100945913396e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7319450939674366e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8246, - "real_time": 8.4659220755574381e+04, - "cpu_time": 2.9196456560756330e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7411532276222599e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4688201884232505e+04, - "cpu_time": 2.9190186706281872e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7385074204961264e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time_median", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4696899785613845e+04, - "cpu_time": 2.9190100945913396e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7377094280765617e+08, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.1739680457131286e+01, - "cpu_time": 9.2881531669333327e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6428388812724396e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.2902339503592842e-04, - "cpu_time": 3.1819437334857731e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.2918956778756565e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7354, - "real_time": 9.1966116547431040e+04, - "cpu_time": 3.0816895580636361e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4252205586217213e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7354, - "real_time": 9.4885934788595288e+04, - "cpu_time": 3.0777875197171140e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3813638479931383e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7354, - "real_time": 9.1913557432849062e+04, - "cpu_time": 3.0729356663040316e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4260355453629310e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7354, - "real_time": 9.1937948933060805e+04, - "cpu_time": 3.0766336429154535e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4256572125122385e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7354, - "real_time": 9.4675557681871054e+04, - "cpu_time": 3.0746958430786361e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3844333554435279e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3075823076761473e+04, - "cpu_time": 3.0767484460157744e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4085421039867115e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time_median", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1966116547431055e+04, - "cpu_time": 3.0766336429154535e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4252205586217213e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5582620761006217e+03, - "cpu_time": 3.3263309417701311e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3436124014036108e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6741856527183137e-02, - "cpu_time": 1.0811189150278283e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6638568309532909e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6184, - "real_time": 1.1316918665687587e+05, - "cpu_time": 3.4268131516817742e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3163902449419327e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6184, - "real_time": 1.1327700101908488e+05, - "cpu_time": 3.4272374142949370e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3141855596603770e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6184, - "real_time": 1.1297093010721942e+05, - "cpu_time": 3.4250612597024674e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3204553574198432e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6184, - "real_time": 1.1307153780989825e+05, - "cpu_time": 3.4261759152651206e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3183906850257058e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6184, - "real_time": 1.1326781771812777e+05, - "cpu_time": 3.4266434411384532e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3143731845558949e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1315129466224124e+05, - "cpu_time": 3.4263862364165502e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3167590063207507e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time_median", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1316918665687589e+05, - "cpu_time": 3.4266434411384526e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3163902449419327e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3095071819006762e+02, - "cpu_time": 8.3257326611190564e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6821700639892318e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1573064062674490e-03, - "cpu_time": 2.4298873759855032e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1577251050590674e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4431, - "real_time": 1.5789855943665479e+05, - "cpu_time": 4.1628248792597128e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3204102803124819e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4431, - "real_time": 1.5777160236391795e+05, - "cpu_time": 4.1603898375085159e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3230821779363737e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4431, - "real_time": 1.5777719608597693e+05, - "cpu_time": 4.1619881832543097e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3229643637113547e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4431, - "real_time": 1.5791993607861301e+05, - "cpu_time": 4.1626227691265865e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3199608169737859e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4431, - "real_time": 1.5761199650776942e+05, - "cpu_time": 4.1621984924395819e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3264472985351434e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5779585809458641e+05, - "cpu_time": 4.1620048323177412e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3225729874938278e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time_median", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5777719608597693e+05, - "cpu_time": 4.1621984924395813e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3229643637113547e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2317122830532601e+02, - "cpu_time": 9.6180982726987438e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5943917153120884e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.8057326594399199e-04, - "cpu_time": 2.3109291459766539e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8083814112658606e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2852, - "real_time": 2.4834617865204110e+05, - "cpu_time": 5.6295093969143729e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2222352914443851e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2852, - "real_time": 2.4542003848437621e+05, - "cpu_time": 5.6266944214585959e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2725769520517530e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2852, - "real_time": 2.4837091855598983e+05, - "cpu_time": 5.6292190322581318e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2218147200821395e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2852, - "real_time": 2.4549606088360318e+05, - "cpu_time": 5.6281518022439245e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2712538695158963e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2852, - "real_time": 2.4839319223175567e+05, - "cpu_time": 5.6269007187937782e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2214361455673800e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4720527776155324e+05, - "cpu_time": 5.6280950743337604e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2418633957323108e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time_median", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4834617865204107e+05, - "cpu_time": 5.6281518022439233e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2222352914443851e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5953068438970563e+03, - "cpu_time": 1.2898761065119669e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7439054801400140e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.4533688695588513e-03, - "cpu_time": 2.2918520200454487e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4686323536505804e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1644, - "real_time": 4.2588470688224555e+05, - "cpu_time": 8.4994227737226116e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9242247164790764e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1644, - "real_time": 4.2585988942286745e+05, - "cpu_time": 8.4994459975667833e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9245116811590223e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1644, - "real_time": 4.2588256343116035e+05, - "cpu_time": 8.5003572810220323e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9242494999187346e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1644, - "real_time": 4.2575428679366224e+05, - "cpu_time": 8.5018429927006806e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9257331401019220e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1644, - "real_time": 4.2561852151398838e+05, - "cpu_time": 8.4963109489052126e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9273043676297693e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2579999360878486e+05, - "cpu_time": 8.4994759987834655e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9252046810577049e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time_median", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2585988942286745e+05, - "cpu_time": 8.4994459975667833e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9245116811590223e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1467656341599775e+02, - "cpu_time": 2.0248822331756710e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3267350081157880e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6932025631113538e-04, - "cpu_time": 2.3823612578769486e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6937662372051246e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 866, - "real_time": 8.0451549339488870e+05, - "cpu_time": 1.4714187424942004e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2134533572509661e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 866, - "real_time": 8.0416426863779442e+05, - "cpu_time": 1.4706190219399640e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2157303719859343e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 866, - "real_time": 8.0493268255503557e+05, - "cpu_time": 1.4719703083141122e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2107512726236258e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 866, - "real_time": 8.0450404510407452e+05, - "cpu_time": 1.4713251374134433e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2135275459769812e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 866, - "real_time": 8.0443328529043566e+05, - "cpu_time": 1.4707835369514623e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2139861399266605e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0450995499644580e+05, - "cpu_time": 1.4712233494226367e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2134897375528336e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time_median", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0450404510407464e+05, - "cpu_time": 1.4713251374134435e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2135275459769812e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7574512300962073e+02, - "cpu_time": 5.3970676029928882e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7866729665162563e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.4274917457154265e-04, - "cpu_time": 3.6684216608653611e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4270192451839467e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 446, - "real_time": 1.5753160680815445e+06, - "cpu_time": 2.7306748071747981e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3250316999659863e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 446, - "real_time": 1.5718174465063275e+06, - "cpu_time": 2.7267315627802936e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3368843936968164e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 446, - "real_time": 1.5749218445605361e+06, - "cpu_time": 2.7300084461882305e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3263646249955635e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 446, - "real_time": 1.5734147059630952e+06, - "cpu_time": 2.7306240874439217e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3314666300041285e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 446, - "real_time": 1.5755861135191314e+06, - "cpu_time": 2.7304507376681161e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3241190234050274e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5742112357261269e+06, - "cpu_time": 2.7296979282510718e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3287732744135046e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time_median", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5749218445605361e+06, - "cpu_time": 2.7304507376681161e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3263646249955635e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5796039763092067e+03, - "cpu_time": 1.6788784055713259e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.3504075583678670e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0034256778637413e-03, - "cpu_time": 6.1504182869310728e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0040598995003673e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 220, - "real_time": 3.1792140153067354e+06, - "cpu_time": 5.3560008181818835e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2771584168992500e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 220, - "real_time": 3.1801726108162920e+06, - "cpu_time": 5.3577139409092274e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2755677295433340e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 220, - "real_time": 3.1795086095702243e+06, - "cpu_time": 5.3553246590909837e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2766694669424992e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 220, - "real_time": 3.1767579853873360e+06, - "cpu_time": 5.3539669181816401e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2812383181762543e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 220, - "real_time": 3.1803027906624433e+06, - "cpu_time": 5.3584681272726897e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2753517838801069e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1791912023486067e+06, - "cpu_time": 5.3562948927272847e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2771971430882902e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time_median", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1795086095702248e+06, - "cpu_time": 5.3560008181818826e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2766694669424992e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4335797596203142e+03, - "cpu_time": 1.8154851125881312e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3807234708130215e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5092593316226677e-04, - "cpu_time": 3.3894420470634957e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5113407861427525e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 100, - "real_time": 7.1065133670344949e+06, - "cpu_time": 1.1948709510000413e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7216448160994682e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 100, - "real_time": 7.1104654856026173e+06, - "cpu_time": 1.1938254599999709e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7190204449963989e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 100, - "real_time": 7.1095663262531161e+06, - "cpu_time": 1.1921918859999893e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7196172678065243e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 100, - "real_time": 7.1137839974835515e+06, - "cpu_time": 1.1942890999999918e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7168190673022451e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 100, - "real_time": 7.0096231997013092e+06, - "cpu_time": 1.1602646649999999e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7869095162532854e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0899904752150178e+06, - "cpu_time": 1.1870884123999987e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7328022224915838e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time_median", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1095663262531161e+06, - "cpu_time": 1.1938254599999709e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7196172678065243e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5001323935543456e+04, - "cpu_time": 1.5028011234890897e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0295744859892122e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.3471628195916150e-03, - "cpu_time": 1.2659555158581644e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4012277369035987e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 49, - "real_time": 1.4392152808758678e+07, - "cpu_time": 2.3773366755102526e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6628787848305330e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 49, - "real_time": 1.4390190284014964e+07, - "cpu_time": 2.3765079775510188e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6635147051909695e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 49, - "real_time": 1.4379852090258988e+07, - "cpu_time": 2.3741692428571623e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6668674739331999e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 49, - "real_time": 1.4290685746438649e+07, - "cpu_time": 2.3493958857142974e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6959862662100773e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 49, - "real_time": 1.4400401019624302e+07, - "cpu_time": 2.3767605142856322e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6602079975791416e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4370656389819119e+07, - "cpu_time": 2.3708340591836728e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6698910455487843e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time_median", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4390190284014964e+07, - "cpu_time": 2.3765079775510188e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6635147051909695e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5299770311501765e+04, - "cpu_time": 1.2044905257427278e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4779153066072494e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1522408637920229e-03, - "cpu_time": 5.0804505742483670e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1647747071443110e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 26, - "real_time": 2.6610708365646694e+07, - "cpu_time": 4.3352412423075750e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0437487854802637e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 26, - "real_time": 2.6803725112516146e+07, - "cpu_time": 4.3448223692306645e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0074281629356918e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 26, - "real_time": 2.6795497235770408e+07, - "cpu_time": 4.3418737230767258e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0089657534261856e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 26, - "real_time": 2.6732672292452592e+07, - "cpu_time": 4.3413806423077315e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0207374156864052e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 26, - "real_time": 2.6816506655170366e+07, - "cpu_time": 4.3370240538461775e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0050414741146793e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6751821932311244e+07, - "cpu_time": 4.3400684061537758e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0171843183286457e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time_median", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6795497235770412e+07, - "cpu_time": 4.3413806423077315e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0089657534261856e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5242790050731011e+04, - "cpu_time": 3.8778502300728083e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6034895217857832e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1864293305486424e-03, - "cpu_time": 8.9349979474388276e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1959948450128841e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.1034783199429512e+07, - "cpu_time": 8.0989923599997848e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2598529702973375e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.1072863116860390e+07, - "cpu_time": 8.1064759899999216e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2559312248813982e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.1090016588568687e+07, - "cpu_time": 8.1035881799999744e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2541665461126900e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.1011231169104576e+07, - "cpu_time": 8.1000039500003129e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2622814593540020e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.1019582524895668e+07, - "cpu_time": 8.1058970100002617e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2614200805938272e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1045695319771767e+07, - "cpu_time": 8.1029914980000526e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2587304562478514e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time_median", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1034783199429512e+07, - "cpu_time": 8.1035881799999744e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2598529702973375e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4246146406524596e+04, - "cpu_time": 3.3859364173007707e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5273471591891833e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.7089195654975982e-04, - "cpu_time": 4.1786251634800241e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7076021266660910e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 8.2808495395713389e+07, - "cpu_time": 1.5344536566666672e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.4832830186622534e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 8.2801898320515946e+07, - "cpu_time": 1.5342250722222340e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.4837995612351646e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 8.2858967284361526e+07, - "cpu_time": 1.5355789011111179e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.4793338560149651e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 8.2826433082421616e+07, - "cpu_time": 1.5342590700000376e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.4818789367127886e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 8.2753898368941411e+07, - "cpu_time": 1.5341328888889113e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.4875603757839937e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2809938490390792e+07, - "cpu_time": 1.5345299177777940e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.4831711496818333e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time_median", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2808495395713389e+07, - "cpu_time": 1.5342590700000378e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.4832830186622534e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8350737490895430e+04, - "cpu_time": 5.9793458239469866e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0028052948934268e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6311757006492195e-04, - "cpu_time": 3.8965325828289388e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6316921542951893e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.7992122471332550e+08, - "cpu_time": 2.7860801674999893e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9678441257324076e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.7943850159645081e+08, - "cpu_time": 2.7833930799999964e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9838987421707163e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.7965969815850258e+08, - "cpu_time": 2.7829260549999899e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9765313813045835e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.7994965612888336e+08, - "cpu_time": 2.7867571625000662e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9669012272575045e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.7952642217278481e+08, - "cpu_time": 2.7828715775000036e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9809682107215366e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time_mean", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7969910055398941e+08, - "cpu_time": 2.7844056085000092e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9752287374373493e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time_median", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7965969815850258e+08, - "cpu_time": 2.7833930799999964e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.9765313813045835e+09, - "hip_id": 1.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time_stddev", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2989096710513532e+05, - "cpu_time": 1.8642356138665709e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.6434176347495234e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time_cv", - "family_index": 1, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/1/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2793106164494469e-03, - "cpu_time": 6.6952731605466622e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2791841066870397e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8934, - "real_time": 7.8131708223486072e+04, - "cpu_time": 2.8120728800089529e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3106074643485012e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8934, - "real_time": 7.8202055855512925e+04, - "cpu_time": 2.8119730378330580e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3094284911025291e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8934, - "real_time": 7.8411000949025300e+04, - "cpu_time": 2.8107535146631126e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3059392019057360e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8934, - "real_time": 7.8338919414926830e+04, - "cpu_time": 2.8104769498544786e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3071408281448483e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8934, - "real_time": 7.8163335267924005e+04, - "cpu_time": 2.8086876158496132e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3100771563674821e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8249403942175035e+04, - "cpu_time": 2.8107927996418427e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3086386283738194e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time_median", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8202055855512939e+04, - "cpu_time": 2.8107535146631126e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3094284911025291e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2002973868928011e+02, - "cpu_time": 1.3751973615781944e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0062321522765316e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5339380575726815e-03, - "cpu_time": 4.8925604254907188e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5330681127528516e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9016, - "real_time": 7.8272066854153585e+04, - "cpu_time": 2.8113004026175541e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6165145272273090e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9016, - "real_time": 7.8221748438384107e+04, - "cpu_time": 2.8103028604702838e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6181976763319552e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9016, - "real_time": 7.8537176412197325e+04, - "cpu_time": 2.8137978737799363e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6076822386015046e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9016, - "real_time": 7.8563104539748034e+04, - "cpu_time": 2.8106313986247254e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6068216270193845e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9016, - "real_time": 7.8482502010693439e+04, - "cpu_time": 2.8097309216947528e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6094988660287037e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8415319651035301e+04, - "cpu_time": 2.8111526914374507e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6117429870417714e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time_median", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8482502010693439e+04, - "cpu_time": 2.8106313986247254e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6094988660287037e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5747546729428430e+02, - "cpu_time": 1.5838399765153989e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2482413974230454e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0082232399878408e-03, - "cpu_time": 5.6341300184072193e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0094785066763180e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8830, - "real_time": 7.8043685151673562e+04, - "cpu_time": 2.8094945990940329e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2483426327699050e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8830, - "real_time": 7.8225704569690977e+04, - "cpu_time": 2.8082965209513338e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2361305309188865e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8830, - "real_time": 7.8367747809973385e+04, - "cpu_time": 2.8089848505096021e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2266399309215911e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8830, - "real_time": 7.8519213858680450e+04, - "cpu_time": 2.8114022763307311e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2165575770689905e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8830, - "real_time": 7.8453962728834696e+04, - "cpu_time": 2.8100085164212674e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2208962524394840e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8322062823770626e+04, - "cpu_time": 2.8096373526613938e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2297133848237716e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time_median", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8367747809973400e+04, - "cpu_time": 2.8094945990940335e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2266399309215911e+07, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9048115059727476e+02, - "cpu_time": 1.1722505496337348e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2732751696903541e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.4320241797751020e-03, - "cpu_time": 4.1722485947281958e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4346939803341831e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8737, - "real_time": 7.8948821625911311e+04, - "cpu_time": 2.8347757582694339e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0376342333286141e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8737, - "real_time": 7.9026173352290192e+04, - "cpu_time": 2.8365889893556002e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0366185850200468e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8737, - "real_time": 7.9015534070152644e+04, - "cpu_time": 2.8309324779672513e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0367581636196835e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8737, - "real_time": 7.9332020824697393e+04, - "cpu_time": 2.8355881584067672e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0326221259511510e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8737, - "real_time": 7.9146161748084516e+04, - "cpu_time": 2.8329476879936183e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0350470343810780e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9093742324227205e+04, - "cpu_time": 2.8341666143985343e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0357360284601146e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time_median", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9026173352290192e+04, - "cpu_time": 2.8347757582694339e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0366185850200468e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5100376283159923e+02, - "cpu_time": 2.2475077355521859e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9747119895063178e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9091745869425786e-03, - "cpu_time": 7.9300480223501283e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9065784478331125e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8569, - "real_time": 8.0586958651769237e+04, - "cpu_time": 2.8581227191037498e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0330833020759866e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8569, - "real_time": 8.0839816575512552e+04, - "cpu_time": 2.8621226735908823e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0267240444188401e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8569, - "real_time": 8.0429866935637241e+04, - "cpu_time": 2.8550313805577427e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0370542217993525e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8569, - "real_time": 8.0588391188393594e+04, - "cpu_time": 2.8615640424785874e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0330471620532408e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8569, - "real_time": 8.0711892475251225e+04, - "cpu_time": 2.8613404854708869e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0299362953264716e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0631385165312779e+04, - "cpu_time": 2.8596362602403696e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0319690051347783e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time_median", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0588391188393580e+04, - "cpu_time": 2.8613404854708863e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0330471620532408e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5358781995847505e+02, - "cpu_time": 3.0124202481579511e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8699170086708578e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9048143553975279e-03, - "cpu_time": 1.0534277698327754e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9045157671655382e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8484, - "real_time": 8.3216442013707609e+04, - "cpu_time": 2.9030878948609869e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9376833720675510e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8484, - "real_time": 8.3269678131304914e+04, - "cpu_time": 2.9067873962753057e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9351659253839481e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8484, - "real_time": 8.3108827260205464e+04, - "cpu_time": 2.9007361232908262e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9427821424319530e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8484, - "real_time": 8.3395034515875828e+04, - "cpu_time": 2.9039563920320204e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9292507270036554e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8484, - "real_time": 8.3166780107375147e+04, - "cpu_time": 2.9007765051861666e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9400347058878338e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3231352405693804e+04, - "cpu_time": 2.9030688623290614e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9369833745549881e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time_median", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.3216442013707609e+04, - "cpu_time": 2.9030878948609869e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9376833720675510e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0916158575195384e+02, - "cpu_time": 2.5155585173878890e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.1605059821688029e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3115440587805006e-03, - "cpu_time": 8.6651699862528165e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3107766762545992e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7833, - "real_time": 8.8461863511395291e+04, - "cpu_time": 2.9942347491383139e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.4083901693477130e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7833, - "real_time": 8.8519569190682028e+04, - "cpu_time": 2.9995666807098064e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.4035606588671255e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7833, - "real_time": 8.8200877497790876e+04, - "cpu_time": 2.9846402080940834e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.4303115636963415e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7833, - "real_time": 8.8322149919352567e+04, - "cpu_time": 2.9881979394866771e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.4201092319244123e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7833, - "real_time": 8.8399602102668199e+04, - "cpu_time": 2.9854856070470269e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.4136080300322866e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8380812444377807e+04, - "cpu_time": 2.9904250368951814e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.4151959307735765e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time_median", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8399602102668214e+04, - "cpu_time": 2.9881979394866771e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.4136080300322866e+08, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2449260841844156e+02, - "cpu_time": 6.3424311852437563e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0450385835939264e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4085931660425799e-03, - "cpu_time": 2.1209129494945663e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4093202571451200e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7292, - "real_time": 9.8764271379881247e+04, - "cpu_time": 3.1439947696105659e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3271195966793716e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7292, - "real_time": 9.6089997309636135e+04, - "cpu_time": 3.1468632707077247e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3640545704006987e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7292, - "real_time": 9.5775014587886326e+04, - "cpu_time": 3.1413840729565802e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3685406425046690e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7292, - "real_time": 9.8574751912635606e+04, - "cpu_time": 3.1404121050465934e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3296711120933473e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7292, - "real_time": 9.6061094464038193e+04, - "cpu_time": 3.1431976686780038e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3644649869054804e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7053025930815507e+04, - "cpu_time": 3.1431703773998935e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3507701817167137e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time_median", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6089997309636135e+04, - "cpu_time": 3.1431976686780044e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3640545704006987e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4822850690192085e+03, - "cpu_time": 2.5058321099128452e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0520312254318159e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5272940279841033e-02, - "cpu_time": 7.9723076035914089e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5191564436400715e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 5958, - "real_time": 1.1740623083200750e+05, - "cpu_time": 3.5038178113459953e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2327946152627349e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 5958, - "real_time": 1.1722764336827341e+05, - "cpu_time": 3.4984756411546806e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2361961092783251e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 5958, - "real_time": 1.1717272489693336e+05, - "cpu_time": 3.5004788939241541e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2372442070506191e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 5958, - "real_time": 1.1702821545290596e+05, - "cpu_time": 3.4976838032897661e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2400068136174474e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 5958, - "real_time": 1.1731607596527779e+05, - "cpu_time": 3.5023831537428679e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2345104696272583e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1723017810307963e+05, - "cpu_time": 3.5005678606914927e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2361504429672771e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time_median", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1722764336827339e+05, - "cpu_time": 3.5004788939241541e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2361961092783251e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4358726781684402e+02, - "cpu_time": 2.5768465657474201e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7395753324630442e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2248319514672136e-03, - "cpu_time": 7.3612244307082110e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2251301521680016e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4345, - "real_time": 1.6150350031502958e+05, - "cpu_time": 4.2380869666282862e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2462949656033530e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4345, - "real_time": 1.6135477488517540e+05, - "cpu_time": 4.2346659677788877e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2492871709132757e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4345, - "real_time": 1.6094436895818170e+05, - "cpu_time": 4.2162465431528958e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2575728085039506e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4345, - "real_time": 1.6094285608146025e+05, - "cpu_time": 4.2218170540850691e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2576034299691734e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4345, - "real_time": 1.6089089612542975e+05, - "cpu_time": 4.2234799148446269e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2586554778790445e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6112727927305532e+05, - "cpu_time": 4.2268592892979534e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2538827705737596e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time_median", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6094436895818167e+05, - "cpu_time": 4.2234799148446263e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2575728085039506e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.8135458736466660e+02, - "cpu_time": 9.1716908952656081e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6774277138859285e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7461635834355978e-03, - "cpu_time": 2.1698595263124911e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7448163053780895e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2802, - "real_time": 2.5237423824526963e+05, - "cpu_time": 5.6995209386154229e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1548456264420404e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2802, - "real_time": 2.4953578669801526e+05, - "cpu_time": 5.7014796716628282e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2021066952972641e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2802, - "real_time": 2.5235630564280596e+05, - "cpu_time": 5.7007964846536098e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1551408724622536e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2802, - "real_time": 2.4951705652387810e+05, - "cpu_time": 5.6966288258385938e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2024221294052262e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2802, - "real_time": 2.5231439268891548e+05, - "cpu_time": 5.6981067630266538e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1558310995473595e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5121955595977692e+05, - "cpu_time": 5.6993065367594222e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1740692846308289e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time_median", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5231439268891551e+05, - "cpu_time": 5.6995209386154229e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1558310995473595e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5457798793668092e+03, - "cpu_time": 1.9747164987276739e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5741238413322698e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.1531033022536909e-03, - "cpu_time": 3.4648364428042884e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1669408574753339e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1628, - "real_time": 4.2988252260047756e+05, - "cpu_time": 8.5769344656025467e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8784304775029030e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1628, - "real_time": 4.2967014111614507e+05, - "cpu_time": 8.5728095761672314e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8808418349766464e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1628, - "real_time": 4.2980742363413086e+05, - "cpu_time": 8.5766990417691076e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8792828710775814e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1628, - "real_time": 4.2956839124666393e+05, - "cpu_time": 8.5759760135139641e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8819979373104925e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1628, - "real_time": 4.2978274708980444e+05, - "cpu_time": 8.5777870085994445e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8795630215509634e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2974224513744441e+05, - "cpu_time": 8.5760412211304589e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8800232284837179e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time_median", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2978274708980444e+05, - "cpu_time": 8.5766990417691076e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8795630215509634e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2348135105707345e+02, - "cpu_time": 1.9187345323899416e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4023521963330039e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.8733817178616086e-04, - "cpu_time": 2.2373196244234258e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8736588550393676e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 862, - "real_time": 8.0816061288634804e+05, - "cpu_time": 1.4772045023202258e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1899386497196770e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 862, - "real_time": 8.0797611587203329e+05, - "cpu_time": 1.4774140777262801e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1911237443858938e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 862, - "real_time": 8.0791152177730750e+05, - "cpu_time": 1.4767057227378213e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1915387848078203e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 862, - "real_time": 8.0813464173547958e+05, - "cpu_time": 1.4778916287702979e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1901054395993690e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 862, - "real_time": 8.0812646436943673e+05, - "cpu_time": 1.4773516856149007e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1901579578546820e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0806187132812093e+05, - "cpu_time": 1.4773135234339049e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1905729152734890e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time_median", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0812646436943661e+05, - "cpu_time": 1.4773516856149007e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1901579578546820e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1087907161876487e+02, - "cpu_time": 4.2634510344099380e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1227322757492436e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3721606668128683e-04, - "cpu_time": 2.8859486945600170e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3722439491776120e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 445, - "real_time": 1.5800152941910403e+06, - "cpu_time": 2.7295567011235743e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3091941773227730e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 445, - "real_time": 1.5717226140766165e+06, - "cpu_time": 2.7307849146067835e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3372064032611055e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 445, - "real_time": 1.5799893926975599e+06, - "cpu_time": 2.7301415303370734e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3092812133870697e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 445, - "real_time": 1.5709092903338121e+06, - "cpu_time": 2.7300141887641135e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3399696924686546e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 445, - "real_time": 1.5796162214213877e+06, - "cpu_time": 2.7295194629214476e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3105354871904707e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5764505625440832e+06, - "cpu_time": 2.7300033595505985e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3212373947260151e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time_median", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5796162214213877e+06, - "cpu_time": 2.7300141887641135e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3105354871904707e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.6987025101864238e+03, - "cpu_time": 5.1567829980663328e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5877880800217642e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.9805581106226607e-03, - "cpu_time": 1.8889291765982367e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9838700329277786e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 220, - "real_time": 3.1861429917626083e+06, - "cpu_time": 5.3590537272730842e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2656820624107218e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 220, - "real_time": 3.1843654980713669e+06, - "cpu_time": 5.3572608727274034e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2686213345048599e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 220, - "real_time": 3.1854622563431887e+06, - "cpu_time": 5.3585612681822367e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2668073421970854e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 220, - "real_time": 3.1861051451414824e+06, - "cpu_time": 5.3604019318186138e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2657446115937862e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 220, - "real_time": 3.1855262265625326e+06, - "cpu_time": 5.3577212727273861e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2667015766823921e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1855204235762358e+06, - "cpu_time": 5.3585998145457450e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2667113854777689e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time_median", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1855262265625326e+06, - "cpu_time": 5.3585612681822358e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2667015766823921e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1881160248536662e+02, - "cpu_time": 1.2267589563877473e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1886301919099987e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2564966062229484e-04, - "cpu_time": 2.2893274341139451e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2568736065307901e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 100, - "real_time": 7.0546700945124030e+06, - "cpu_time": 1.1733475930000167e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7563431812496653e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 100, - "real_time": 7.1264962712302804e+06, - "cpu_time": 1.1948753700000906e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7084051857936831e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 100, - "real_time": 6.8996255705133080e+06, - "cpu_time": 1.1212203989999807e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.8632250630237703e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 100, - "real_time": 7.0510380715131760e+06, - "cpu_time": 1.1765065190000996e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7587931960774546e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 100, - "real_time": 7.1213378477841616e+06, - "cpu_time": 1.1942133170000488e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7118157735544901e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0506335711106658e+06, - "cpu_time": 1.1720326396000475e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7597164799398127e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time_median", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0546700945124049e+06, - "cpu_time": 1.1765065190000996e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7563431812496653e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1616206802506320e+04, - "cpu_time": 3.0072417911528522e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2557143773407049e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2994038887213687e-02, - "cpu_time": 2.5658345079699014e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3143039934638731e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 50, - "real_time": 1.4358119666576385e+07, - "cpu_time": 2.3649018159999285e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6739312360113335e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 50, - "real_time": 1.4380571041256189e+07, - "cpu_time": 2.3745463220000148e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6666341557280626e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 50, - "real_time": 1.4390750322490931e+07, - "cpu_time": 2.3766411699998569e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6633332172483940e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 50, - "real_time": 1.4347553234547377e+07, - "cpu_time": 2.3665596419998564e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6773734101511478e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 50, - "real_time": 1.4371873345226049e+07, - "cpu_time": 2.3684911860000286e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6694583502081699e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4369773522019390e+07, - "cpu_time": 2.3702280271999370e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6701460738694220e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time_median", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4371873345226049e+07, - "cpu_time": 2.3684911860000286e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6694583502081699e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7252357514184718e+04, - "cpu_time": 5.1141534888472001e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6076597246837290e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2006005166155353e-03, - "cpu_time": 2.1576630729866074e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2007461085767571e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 26, - "real_time": 2.6888132238617308e+07, - "cpu_time": 4.3679104384615093e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9917088628132238e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 26, - "real_time": 2.6818045701545019e+07, - "cpu_time": 4.3608271499998897e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0047542424863405e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 26, - "real_time": 2.6906218093175154e+07, - "cpu_time": 4.3764465230769753e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9883535298498430e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 26, - "real_time": 2.6839264095402680e+07, - "cpu_time": 4.3674642923073970e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0007976195960703e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 26, - "real_time": 2.6832328607829716e+07, - "cpu_time": 4.3639296653846212e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0020902010284357e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6856797747313976e+07, - "cpu_time": 4.3673156138460793e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9975408911547823e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time_median", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6839264095402680e+07, - "cpu_time": 4.3674642923073970e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0007976195960703e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8184125360944730e+04, - "cpu_time": 5.8590578391117335e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1020261239733556e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4217676180237695e-03, - "cpu_time": 1.3415695949558245e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4211041547540573e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.1054961234331131e+07, - "cpu_time": 8.0973996699992761e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2577741616126165e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.1040897145867348e+07, - "cpu_time": 8.0992308999998391e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2592229175135994e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.1056816801428795e+07, - "cpu_time": 8.1009095699994296e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2575830773783760e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.1083281636238098e+07, - "cpu_time": 8.1061215299996540e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2548592690563145e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.1099408790469170e+07, - "cpu_time": 8.1077404799998477e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2532008168765230e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1067073121666908e+07, - "cpu_time": 8.1022804299996108e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2565280484874859e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time_median", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.1056816801428795e+07, - "cpu_time": 8.1009095699994296e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2575830773783760e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.3692736486831425e+04, - "cpu_time": 4.4600141195923708e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4384163894462325e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.6395328806849112e-04, - "cpu_time": 5.5046405245104380e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.6388345443107887e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 8.8904720731079578e+07, - "cpu_time": 1.5475204137500498e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.0387222139073553e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 8.8871059939265251e+07, - "cpu_time": 1.5472776562499747e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.0410094395959625e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 8.8820379227399826e+07, - "cpu_time": 1.5496675762500444e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.0444564262160110e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 8.9015362784266472e+07, - "cpu_time": 1.5483108575000414e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.0312163564522629e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 8.8900898583233356e+07, - "cpu_time": 1.5481085275000340e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.0389818388320932e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8902484253048912e+07, - "cpu_time": 1.5481770062500289e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.0388772550007372e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time_median", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8900898583233356e+07, - "cpu_time": 1.5481085275000340e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 6.0389818388320932e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.1550334924568422e+04, - "cpu_time": 9.3332049083835504e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.8579240598099101e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.0481817269481548e-04, - "cpu_time": 6.0285128061618085e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0444159645522010e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.8375889211893082e+08, - "cpu_time": 2.8148274099999070e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8432101522742214e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8359233438968658e+08, - "cpu_time": 2.8163505149998969e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8485112004780855e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.8404061719775200e+08, - "cpu_time": 2.8175963775001377e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8342655026322927e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8408229574561119e+08, - "cpu_time": 2.8151237675001538e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8329445515164356e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8375937268137932e+08, - "cpu_time": 2.8161753624999619e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8431948712720232e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time_mean", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8384670242667201e+08, - "cpu_time": 2.8160146865000117e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8404252556346130e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time_median", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8375937268137932e+08, - "cpu_time": 2.8161753624999619e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.8431948712720232e+09, - "hip_id": 2.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time_stddev", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.0805491052082609e+05, - "cpu_time": 1.1004210698286895e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6089412005736595e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time_cv", - "family_index": 2, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/2/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1316760527908280e-03, - "cpu_time": 3.9077248961239924e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1315856142834141e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9551, - "real_time": 7.5213892547279727e+04, - "cpu_time": 2.7433647513349610e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3614506114762109e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9551, - "real_time": 7.5291537655092165e+04, - "cpu_time": 2.7424473144173791e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3600466027017634e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9551, - "real_time": 7.5125689708821854e+04, - "cpu_time": 2.7419776285205525e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3630490501570115e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9551, - "real_time": 7.5198531170149319e+04, - "cpu_time": 2.7410739158202906e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3617287253696855e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9551, - "real_time": 7.5454320553748214e+04, - "cpu_time": 2.7421237336404616e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3571124787620032e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5256794327018259e+04, - "cpu_time": 2.7421974687467294e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3606774936933352e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time_median", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5213892547279727e+04, - "cpu_time": 2.7421237336404610e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3614506114762109e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2514720148320457e+02, - "cpu_time": 8.2781478397116643e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2602231142459976e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6629355874420357e-03, - "cpu_time": 3.0188007734888031e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6611012710374107e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9311, - "real_time": 7.4974807966653301e+04, - "cpu_time": 2.7413886628719221e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7315841887996472e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9311, - "real_time": 7.5044883284884345e+04, - "cpu_time": 2.7426807206530450e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7290334934967000e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9311, - "real_time": 7.5261954194968639e+04, - "cpu_time": 2.7447813113521674e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7211624012506858e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9311, - "real_time": 7.5038352846846392e+04, - "cpu_time": 2.7412467737084994e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7292709958332602e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9311, - "real_time": 7.5123794557768357e+04, - "cpu_time": 2.7435537385887362e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7261668717028636e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5088758570224207e+04, - "cpu_time": 2.7427302414348745e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7274435902166314e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time_median", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5044883284884345e+04, - "cpu_time": 2.7426807206530450e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7290334934967000e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1031178826541118e+02, - "cpu_time": 1.4906372139386821e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0029709384874383e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4690852581115165e-03, - "cpu_time": 5.4348662927887763e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4676640619978858e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9282, - "real_time": 7.5258890835269718e+04, - "cpu_time": 2.7467744947208988e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4425463284670547e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9282, - "real_time": 7.5483254655089229e+04, - "cpu_time": 2.7442775856495975e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4263690916828260e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9282, - "real_time": 7.4993768838753545e+04, - "cpu_time": 2.7411857218272012e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4617871103490457e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9282, - "real_time": 7.5261060416557637e+04, - "cpu_time": 2.7449507185951486e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4423894339640066e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9282, - "real_time": 7.5273716461958524e+04, - "cpu_time": 2.7467811387631722e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4414743851129197e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5254138241525739e+04, - "cpu_time": 2.7447939319112041e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4429132699151710e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time_median", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5261060416557637e+04, - "cpu_time": 2.7449507185951492e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.4423894339640066e+07, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.7373857317145377e+02, - "cpu_time": 2.3011951051263196e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2573892850863650e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3086912857050519e-03, - "cpu_time": 8.3838538054621604e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3101402185413873e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9183, - "real_time": 7.6388515552889861e+04, - "cpu_time": 2.7720102471958788e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0724125139371276e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9183, - "real_time": 7.6105587909530674e+04, - "cpu_time": 2.7699398867472162e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0763992796084975e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9183, - "real_time": 7.6046405002489686e+04, - "cpu_time": 2.7694247489927005e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0772369844086385e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9183, - "real_time": 7.5986727591799528e+04, - "cpu_time": 2.7689852488293691e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0780830099708201e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9183, - "real_time": 7.6200860848326411e+04, - "cpu_time": 2.7725170314712101e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0750534716800277e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6145619381007244e+04, - "cpu_time": 2.7705754326472746e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0758370519210222e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time_median", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6105587909530688e+04, - "cpu_time": 2.7699398867472156e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0763992796084975e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5711682144071969e+02, - "cpu_time": 1.5878582133117351e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2170756021728262e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0633730832834863e-03, - "cpu_time": 5.7311495460513127e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0607912677984091e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9015, - "real_time": 7.7535490609447952e+04, - "cpu_time": 2.7946059179145494e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1130968374892253e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9015, - "real_time": 7.7878356874051096e+04, - "cpu_time": 2.7974091713810584e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1037937441973838e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9015, - "real_time": 7.7660210753685911e+04, - "cpu_time": 2.7945113288962707e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1097032625838426e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9015, - "real_time": 7.7597967088010715e+04, - "cpu_time": 2.7942844292844733e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1113955190884647e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9015, - "real_time": 7.7641573822070510e+04, - "cpu_time": 2.7940363693844568e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1102096716311869e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7662719829453257e+04, - "cpu_time": 2.7949694433721626e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1096398069980207e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time_median", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7641573822070524e+04, - "cpu_time": 2.7945113288962713e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1102096716311869e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2974299213617721e+02, - "cpu_time": 1.3814995257213826e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.5191905086255277e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6705955240956256e-03, - "cpu_time": 4.9428072603705745e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6681475657369549e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8736, - "real_time": 7.9659545995277629e+04, - "cpu_time": 2.8410601064561366e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1135057437990612e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8736, - "real_time": 7.9581086440104074e+04, - "cpu_time": 2.8401165762362565e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1175612781640667e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8736, - "real_time": 7.9871436351296550e+04, - "cpu_time": 2.8376949107142410e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1025930541523409e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8736, - "real_time": 7.9906365094707377e+04, - "cpu_time": 2.8375233928571327e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1007997249233401e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8736, - "real_time": 7.9801986875291725e+04, - "cpu_time": 2.8367612557233631e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1061634281371033e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9764084151335468e+04, - "cpu_time": 2.8386312483974261e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1081246458351827e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time_median", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9801986875291725e+04, - "cpu_time": 2.8376949107142410e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1061634281371033e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3930305681562373e+02, - "cpu_time": 1.8511141920381255e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.1781890610376094e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7464383663119063e-03, - "cpu_time": 6.5211506182185090e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7473153031797267e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8222, - "real_time": 8.5215729444221288e+04, - "cpu_time": 2.9270914522014052e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.6905989571910167e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8222, - "real_time": 8.5287774909282089e+04, - "cpu_time": 2.9306485125274782e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.6841024484116948e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8222, - "real_time": 8.5027086251323912e+04, - "cpu_time": 2.9355862819265516e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7076615099202681e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8222, - "real_time": 8.4942084454380922e+04, - "cpu_time": 2.9272745013378514e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7153745897531891e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8222, - "real_time": 8.5305174657506010e+04, - "cpu_time": 2.9302273729020776e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.6825351173738539e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5155569943342853e+04, - "cpu_time": 2.9301656241790729e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.6960545245300055e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time_median", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5215729444221288e+04, - "cpu_time": 2.9302273729020776e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.6905989571910167e+08, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6245230236349656e+02, - "cpu_time": 3.4434593474849919e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4691636553086929e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9077119966618987e-03, - "cpu_time": 1.1751756689350028e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9089829088735752e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7562, - "real_time": 9.5624914734477585e+04, - "cpu_time": 3.0966503834964224e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3706888038953929e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7562, - "real_time": 9.3088596688505117e+04, - "cpu_time": 3.1005374173498777e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4080349759551721e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7562, - "real_time": 9.2516574155783062e+04, - "cpu_time": 3.0855738971171045e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4167407428997078e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7562, - "real_time": 9.5322923234877147e+04, - "cpu_time": 3.0883745305474050e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3750312679462900e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7562, - "real_time": 9.2550661895009456e+04, - "cpu_time": 3.0874162774398772e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4162189369179184e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3820734141730456e+04, - "cpu_time": 3.0917105011901370e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3973429455228963e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time_median", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3088596688505102e+04, - "cpu_time": 3.0883745305474044e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4080349759551721e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5298350984723377e+03, - "cpu_time": 6.5104503184835426e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2666888467330489e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6305938260526606e-02, - "cpu_time": 2.1057761766431170e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6221421190807508e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6149, - "real_time": 1.1386292580699017e+05, - "cpu_time": 3.4474549048626976e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3022770418209882e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6149, - "real_time": 1.1386690716863541e+05, - "cpu_time": 3.4449239404781582e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3021965425983524e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6149, - "real_time": 1.1386485947821775e+05, - "cpu_time": 3.4380769686126994e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3022379441845961e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6149, - "real_time": 1.1388572556625560e+05, - "cpu_time": 3.4429628899007972e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3018161292522283e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6149, - "real_time": 1.1393799398330768e+05, - "cpu_time": 3.4406765896893624e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3007601839857302e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1388368240068131e+05, - "cpu_time": 3.4428190587087430e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3018575683683791e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time_median", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1386690716863540e+05, - "cpu_time": 3.4429628899007972e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3021965425983524e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1703586331152479e+01, - "cpu_time": 3.6407374327030686e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.4060848873551469e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.7838567969385233e-04, - "cpu_time": 1.0574873005578622e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.7830066357650265e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4411, - "real_time": 1.5842414877239263e+05, - "cpu_time": 4.1746662366808759e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3093944582479191e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4411, - "real_time": 1.5862854996508625e+05, - "cpu_time": 4.1774214713217912e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3051301302028828e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4411, - "real_time": 1.5842719783575126e+05, - "cpu_time": 4.1690007776014722e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3093307661955457e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4411, - "real_time": 1.5839603501320840e+05, - "cpu_time": 4.1707573135345348e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3099818436508241e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4411, - "real_time": 1.5811709634408844e+05, - "cpu_time": 4.1679016164135042e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3158210726249638e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5839860558610540e+05, - "cpu_time": 4.1719494831104355e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3099316541844273e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time_median", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5842414877239263e+05, - "cpu_time": 4.1707573135345348e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3093944582479191e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8275560847031778e+02, - "cpu_time": 3.9945200653251260e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.8207344496889599e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1537703112605489e-03, - "cpu_time": 9.5747086140337786e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1543242727863501e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2799, - "real_time": 2.4691723686407204e+05, - "cpu_time": 5.6540773383351916e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2466699097934632e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2799, - "real_time": 2.4994141837713757e+05, - "cpu_time": 5.6575304394426872e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1952870668990111e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2799, - "real_time": 2.4701881003820628e+05, - "cpu_time": 5.6467824330117949e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2449236956400900e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2799, - "real_time": 2.4958002872662080e+05, - "cpu_time": 5.6459011861378921e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2013618050688052e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2799, - "real_time": 2.4706511257919067e+05, - "cpu_time": 5.6489361271884677e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2441281533179016e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4810452131704552e+05, - "cpu_time": 5.6506455048232072e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2264741261438546e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time_median", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4706511257919070e+05, - "cpu_time": 5.6489361271884688e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2441281533179016e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5182306151141570e+03, - "cpu_time": 4.9883279133126450e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5803014849958908e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.1193186123926161e-03, - "cpu_time": 8.8278903871332414e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.1050923488087296e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1636, - "real_time": 4.2757288426016219e+05, - "cpu_time": 8.5247286246948154e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9047824995468168e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1636, - "real_time": 4.2732818558678933e+05, - "cpu_time": 8.5242145721269352e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9075910991461468e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1636, - "real_time": 4.2718157957721851e+05, - "cpu_time": 8.5125981112469709e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9092753532948465e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1636, - "real_time": 4.2722960128884390e+05, - "cpu_time": 8.5168324205382355e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9087235380540609e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1636, - "real_time": 4.2709278338133357e+05, - "cpu_time": 8.5122874022001727e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9102960330929756e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2728100681886950e+05, - "cpu_time": 8.5181322261614283e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9081337046269693e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time_median", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2722960128884402e+05, - "cpu_time": 8.5168324205382378e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9087235380540609e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8396646727102240e+02, - "cpu_time": 6.0618746215126828e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1125769672511341e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.3055147393670221e-04, - "cpu_time": 7.1164363977528665e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3042367922038819e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 867, - "real_time": 8.0566712787520944e+05, - "cpu_time": 1.4705510738177469e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2060011571548939e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 867, - "real_time": 8.0599819123100454e+05, - "cpu_time": 1.4707083713955898e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2038627947713156e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 867, - "real_time": 8.0531002226422064e+05, - "cpu_time": 1.4705216332178980e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2083096994213953e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 867, - "real_time": 8.0563906151070888e+05, - "cpu_time": 1.4711324279122793e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2061825206625080e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 867, - "real_time": 8.0578891629451991e+05, - "cpu_time": 1.4711716366782438e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2052143125619278e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0568066383513273e+05, - "cpu_time": 1.4708170286043517e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2059140969144077e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time_median", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0566712787520944e+05, - "cpu_time": 1.4707083713955900e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2060011571548939e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5091402468197498e+02, - "cpu_time": 3.1425323432473328e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6214253624758681e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1143111153691505e-04, - "cpu_time": 2.1365895839737866e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1145833993628547e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 445, - "real_time": 1.5749198374118698e+06, - "cpu_time": 2.7204448898874545e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3263714131541719e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 445, - "real_time": 1.5682641372314834e+06, - "cpu_time": 2.7192282516853595e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3489764898971233e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 445, - "real_time": 1.5752578253617112e+06, - "cpu_time": 2.7211733123596297e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3252285847707529e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 445, - "real_time": 1.5692248822744477e+06, - "cpu_time": 2.7203975235955040e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3457016229831142e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 445, - "real_time": 1.5748788576489419e+06, - "cpu_time": 2.7206113573034662e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3265100101241655e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5725091079856909e+06, - "cpu_time": 2.7203710669662831e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3345576241858654e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time_median", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5748788576489419e+06, - "cpu_time": 2.7204448898874545e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3265100101241655e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.4564682940122584e+03, - "cpu_time": 7.0949165828184323e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1735645669797637e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1980593158152381e-03, - "cpu_time": 2.6080694170632304e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1999285595098758e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 220, - "real_time": 3.1770056843842296e+06, - "cpu_time": 5.3455667090908969e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2808265601991758e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 220, - "real_time": 3.1800143960440024e+06, - "cpu_time": 5.3495230318183284e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2758302040617085e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 220, - "real_time": 3.1781176941215317e+06, - "cpu_time": 5.3471278545456156e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2789788216567030e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 220, - "real_time": 3.1743656346489759e+06, - "cpu_time": 5.3414116818177346e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2852185069270506e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 220, - "real_time": 3.1790100270882249e+06, - "cpu_time": 5.3495945818181923e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2774970374556780e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1777026872573933e+06, - "cpu_time": 5.3466447718181545e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2796702260600634e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time_median", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1781176941215312e+06, - "cpu_time": 5.3471278545456165e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2789788216567030e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1706622703028706e+03, - "cpu_time": 3.3825500273430312e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.6078763466172176e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.8309168098300689e-04, - "cpu_time": 6.3264910456970142e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8335259441186416e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 102, - "real_time": 6.9069803473265730e+06, - "cpu_time": 1.1297495019607818e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.8580465431594334e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 102, - "real_time": 7.1055654792443793e+06, - "cpu_time": 1.1931281529412303e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7222746870764532e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 102, - "real_time": 7.1135969129482321e+06, - "cpu_time": 1.1925103450981205e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7169431176124029e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 102, - "real_time": 7.0308465191035299e+06, - "cpu_time": 1.1667667127450805e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7724597470346098e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 102, - "real_time": 6.9537759785923883e+06, - "cpu_time": 1.1412094862745402e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.8253541821449680e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0221530474430202e+06, - "cpu_time": 1.1646728398039509e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7790156554055738e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time_median", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.0308465191035299e+06, - "cpu_time": 1.1667667127450805e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.7724597470346098e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.1289875073610368e+04, - "cpu_time": 2.8979235391878884e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.2266880540804997e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.3000268501247176e-02, - "cpu_time": 2.4881867595329996e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3029227152745262e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 50, - "real_time": 1.4371413476765156e+07, - "cpu_time": 2.3711329000000205e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6696077674264688e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 50, - "real_time": 1.4310549031943083e+07, - "cpu_time": 2.3568100979998689e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6894681573854313e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 50, - "real_time": 1.4315169826149940e+07, - "cpu_time": 2.3561119880000662e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6879544437824459e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 50, - "real_time": 1.4338939692825079e+07, - "cpu_time": 2.3625259600000843e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6801831542383814e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 50, - "real_time": 1.4379909615963697e+07, - "cpu_time": 2.3742721679998342e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6668488044945593e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4343196328729395e+07, - "cpu_time": 2.3641706227999747e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6788124654654579e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time_median", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4338939692825079e+07, - "cpu_time": 2.3625259600000847e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.6801831542383814e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.1676184611617275e+04, - "cpu_time": 8.2513386055530544e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0330222351759907e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2084467008354294e-03, - "cpu_time": 3.4901620576693777e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2078727087285030e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 26, - "real_time": 2.6921875631579988e+07, - "cpu_time": 4.3262403269230053e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9854523450275316e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 26, - "real_time": 2.6888331183447286e+07, - "cpu_time": 4.3265659730768494e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 4.9916719295180988e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 26, - "real_time": 2.6643029987238921e+07, - "cpu_time": 4.3310815615383871e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0376300317300844e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 26, - "real_time": 2.6807702433031339e+07, - "cpu_time": 4.3295899576920554e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0066852366513319e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 26, - "real_time": 2.6738797242824849e+07, - "cpu_time": 4.3339647730769791e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0195873352536936e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6799947295624476e+07, - "cpu_time": 4.3294885184614561e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0082053756361485e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time_median", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6807702433031339e+07, - "cpu_time": 4.3295899576920561e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0066852366513319e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1302736783624697e+05, - "cpu_time": 3.2278844208624614e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1146663187799629e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.2174473923200775e-03, - "cpu_time": 7.4555791223336815e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.2224033564345499e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 16, - "real_time": 4.3017422547563910e+07, - "cpu_time": 8.1474019562499225e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.2401566645047998e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 16, - "real_time": 4.3008811771869659e+07, - "cpu_time": 8.1446574999993965e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.2414060035848951e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 16, - "real_time": 4.3006013380363584e+07, - "cpu_time": 8.1527155437498778e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.2418121304535246e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 16, - "real_time": 4.3025172315537930e+07, - "cpu_time": 8.1481115937499732e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.2390326767630014e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 16, - "real_time": 4.2943371925503016e+07, - "cpu_time": 8.1486710749999240e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.2509170557373667e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3000158388167620e+07, - "cpu_time": 8.1483115337498188e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.2426649062087173e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time_median", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.3008811771869659e+07, - "cpu_time": 8.1481115937499732e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 6.2414060035848951e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2625189993348329e+04, - "cpu_time": 2.9044725819412801e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7406329058639416e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.5872255396914581e-04, - "cpu_time": 3.5645085118691508e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5939249937139635e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 9.2747760936617851e+07, - "cpu_time": 1.5140305525000030e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.7885053674437265e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 9.2776619829237461e+07, - "cpu_time": 1.5129814837500533e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.7867048076137333e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 9.2745499685406685e+07, - "cpu_time": 1.5139755999999237e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.7886464984400263e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 9.2816980555653572e+07, - "cpu_time": 1.5130108025000766e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.7841885050127144e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 9.2949240468442440e+07, - "cpu_time": 1.5167432274999726e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.7759580314405594e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2807220295071602e+07, - "cpu_time": 1.5141483332500061e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.7848006419901524e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time_median", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2776619829237461e+07, - "cpu_time": 1.5139755999999237e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.7867048076137333e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4478147776588768e+04, - "cpu_time": 1.5356349833642165e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.2608916128276205e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.1025404605373005e-04, - "cpu_time": 1.0141905846622642e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.0943352042944549e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.8595119938254356e+08, - "cpu_time": 2.8156681125000203e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7743205075600014e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8656904250383377e+08, - "cpu_time": 2.8260201250000703e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7551982343369532e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.8656812608242035e+08, - "cpu_time": 2.8246645350000674e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7552265038329868e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8610732257366180e+08, - "cpu_time": 2.8185950249999791e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7694764996418123e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8621900677680969e+08, - "cpu_time": 2.8192582174997938e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7660162761308193e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time_mean", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8628293946385387e+08, - "cpu_time": 2.8208412029999864e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7640476043005142e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time_median", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8621900677680969e+08, - "cpu_time": 2.8192582174997938e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.7660162761308193e+09, - "hip_id": 3.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time_stddev", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7756373997894325e+05, - "cpu_time": 4.3517561020075966e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5878442729057446e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time_cv", - "family_index": 3, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/3/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4900115962192095e-03, - "cpu_time": 1.5427157322359978e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4898982212600770e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9015, - "real_time": 7.7362615567575471e+04, - "cpu_time": 2.7961024004436290e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3236367365391703e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9015, - "real_time": 7.7254123510969759e+04, - "cpu_time": 2.7941708973932732e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3254955897009125e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9015, - "real_time": 7.7393746579096143e+04, - "cpu_time": 2.7956084093178360e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3231043143175341e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9015, - "real_time": 7.7339282778920257e+04, - "cpu_time": 2.7965451735995122e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3240360696480410e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9015, - "real_time": 7.7319897091944906e+04, - "cpu_time": 2.8015313843593263e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3243680326970831e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7333933105701319e+04, - "cpu_time": 2.7967916530227161e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3241281485805482e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time_median", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7339282778920271e+04, - "cpu_time": 2.7961024004436296e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3240360696480410e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.2429799053870553e+01, - "cpu_time": 2.7959479658136235e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.9800341469979940e+03, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 6.7796628140209326e-04, - "cpu_time": 9.9969833748317274e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.7818467242951514e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9138, - "real_time": 7.7511673859869872e+04, - "cpu_time": 2.8023705044867692e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6421826519996125e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9138, - "real_time": 7.7485256136519529e+04, - "cpu_time": 2.8003935095206776e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6430834743472680e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9138, - "real_time": 7.7333483637860816e+04, - "cpu_time": 2.7984116447801370e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6482707149084684e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9138, - "real_time": 7.7351479273860488e+04, - "cpu_time": 2.7998765222149005e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6476546010828316e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9138, - "real_time": 7.7348519179733426e+04, - "cpu_time": 2.7991797647187259e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6477559256707910e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7406082417568832e+04, - "cpu_time": 2.8000463891442423e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6457894736017942e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time_median", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7351479273860488e+04, - "cpu_time": 2.7998765222149005e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.6476546010828316e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.5122915436167716e+01, - "cpu_time": 1.4978556752302083e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.9083408811984198e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.0996928507112690e-03, - "cpu_time": 5.3493959280009895e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0992336730553268e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9116, - "real_time": 7.7158126017507224e+04, - "cpu_time": 2.8007515072400711e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.3085789033686675e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9116, - "real_time": 7.7188033556339913e+04, - "cpu_time": 2.8014589940763765e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.3065220232749030e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9116, - "real_time": 7.7394447316991398e+04, - "cpu_time": 2.8004291761737346e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2923693391383030e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9116, - "real_time": 7.7316690641734007e+04, - "cpu_time": 2.7971990982887626e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2976918256626226e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9116, - "real_time": 7.7287098355554524e+04, - "cpu_time": 2.7977130210617639e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2997202471706279e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7268879177625437e+04, - "cpu_time": 2.7995103593681415e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.3009764677230246e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time_median", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7287098355554524e+04, - "cpu_time": 2.8004291761737352e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.2997202471706279e+07, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6420315704793637e+01, - "cpu_time": 1.9205599678757829e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6143752572521917e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2478544626374475e-03, - "cpu_time": 6.8603424218414370e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2477654442584845e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9074, - "real_time": 7.7725708245404239e+04, - "cpu_time": 2.8202797575490142e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0539627344578588e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9074, - "real_time": 7.7859137575426401e+04, - "cpu_time": 2.8221438968481199e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0521565297411576e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9074, - "real_time": 7.7715238471154604e+04, - "cpu_time": 2.8176804981265136e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0541047240099001e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9074, - "real_time": 7.7741264444046901e+04, - "cpu_time": 2.8176857780470827e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0537518341878872e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9074, - "real_time": 7.7988178347545982e+04, - "cpu_time": 2.8210437194181210e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0504156108754364e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7805905416715628e+04, - "cpu_time": 2.8197667299977702e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0528782866544481e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time_median", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.7741264444046916e+04, - "cpu_time": 2.8202797575490142e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0537518341878872e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1714053598199548e+02, - "cpu_time": 2.0141714130981990e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5834271337829222e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5055481374403399e-03, - "cpu_time": 7.1430426909810081e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5039033037848172e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8716, - "real_time": 7.9684315114476543e+04, - "cpu_time": 2.8523924242771446e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0561135496317342e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8716, - "real_time": 7.9663877610685435e+04, - "cpu_time": 2.8524882801745000e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0566410387488329e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8716, - "real_time": 7.9502316095478716e+04, - "cpu_time": 2.8501688916933810e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0608204646923181e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8716, - "real_time": 7.9386849745181855e+04, - "cpu_time": 2.8514000114731072e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0638178807434511e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8716, - "real_time": 7.9443075165940638e+04, - "cpu_time": 2.8499279256539245e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0623572244373864e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9536086746352637e+04, - "cpu_time": 2.8512755066544120e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0599500316507447e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time_median", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9502316095478716e+04, - "cpu_time": 2.8514000114731066e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0608204646923181e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3263243154899035e+02, - "cpu_time": 1.2014987774571925e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4344037220455025e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6675755242015673e-03, - "cpu_time": 4.2138992694781352e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6672267138894321e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8441, - "real_time": 8.2085334821090029e+04, - "cpu_time": 2.8957831548394921e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9919432711604136e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8441, - "real_time": 8.2143984897463917e+04, - "cpu_time": 2.8977664328871056e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9890930590843141e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8441, - "real_time": 8.2079557057364931e+04, - "cpu_time": 2.8961201753347123e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9922242729817158e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8441, - "real_time": 8.2225881197256778e+04, - "cpu_time": 2.8956002701102104e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9851199552840072e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8441, - "real_time": 8.2201885785523540e+04, - "cpu_time": 2.8932827840303775e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9862832448268145e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2147328751739842e+04, - "cpu_time": 2.8957105634403799e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9889327606674528e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time_median", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2143984897463903e+04, - "cpu_time": 2.8957831548394926e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.9890930590843141e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.6321919427625119e+01, - "cpu_time": 1.6051423678556924e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.2202616906083893e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.0735333011325023e-04, - "cpu_time": 5.5431726779648532e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.0729906564520665e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7836, - "real_time": 8.8688671075524864e+04, - "cpu_time": 2.9939864229197567e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.3894443569000292e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7836, - "real_time": 8.8674069093054204e+04, - "cpu_time": 2.9921063910158206e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.3906611786616886e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7836, - "real_time": 8.8733631265959091e+04, - "cpu_time": 2.9993084137314494e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.3857002204238188e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7836, - "real_time": 8.8700981270626464e+04, - "cpu_time": 2.9907412633997132e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.3884188270758617e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7836, - "real_time": 8.8706349813110268e+04, - "cpu_time": 2.9918909660540766e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.3879716771204770e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8700740503654975e+04, - "cpu_time": 2.9936066914241633e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.3884392520363760e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time_median", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.8700981270626449e+04, - "cpu_time": 2.9921063910158206e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.3884188270758617e+08, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2194367543825887e+01, - "cpu_time": 3.3933437009812303e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8485488427412460e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5021625995232084e-04, - "cpu_time": 1.1335302365211169e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5019476775582275e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7146, - "real_time": 9.8003331283784777e+04, - "cpu_time": 3.1602160635320115e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3374239251159682e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7146, - "real_time": 1.0001559941070367e+05, - "cpu_time": 3.1620324601175857e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3105155672943223e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7146, - "real_time": 9.7968540130702269e+04, - "cpu_time": 3.1658422879932815e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3378988788149092e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7146, - "real_time": 9.7755563400532061e+04, - "cpu_time": 3.1566256717044982e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3408137137214494e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7146, - "real_time": 9.9944553700327000e+04, - "cpu_time": 3.1586792625245819e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3114471489162412e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8737517585209949e+04, - "cpu_time": 3.1606791491743922e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3276198467725782e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time_median", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.8003331283784792e+04, - "cpu_time": 3.1602160635320109e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3374239251159682e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1385318624662823e+03, - "cpu_time": 3.5047869935558913e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5247697444007734e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1530894135390178e-02, - "cpu_time": 1.1088714887341174e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1484987574624341e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6059, - "real_time": 1.1537137717456037e+05, - "cpu_time": 3.4822754563459498e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2721753559669156e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6059, - "real_time": 1.1544505176931965e+05, - "cpu_time": 3.4837973593002831e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2707253016249819e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6059, - "real_time": 1.1537269357770208e+05, - "cpu_time": 3.4785612196731160e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2721494304321609e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6059, - "real_time": 1.1516251035783527e+05, - "cpu_time": 3.4725935005774646e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2762963327688923e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6059, - "real_time": 1.1517970947875416e+05, - "cpu_time": 3.4766839527973585e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2759564265818415e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1530626847163432e+05, - "cpu_time": 3.4787822977388342e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2734605694749589e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time_median", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1537137717456036e+05, - "cpu_time": 3.4785612196731160e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2721753559669156e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2707853435878664e+02, - "cpu_time": 4.4751015857940837e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5061626898188395e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.1020956279584083e-03, - "cpu_time": 1.2863988610908033e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1023559077594303e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4382, - "real_time": 1.5944017329201609e+05, - "cpu_time": 4.2048281857602898e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2883055077954655e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4382, - "real_time": 1.5933275485948144e+05, - "cpu_time": 4.2032319169326581e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2905224067855940e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4382, - "real_time": 1.5937876244306623e+05, - "cpu_time": 4.2041344796897628e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2895725375411158e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4382, - "real_time": 1.5948501482950454e+05, - "cpu_time": 4.2097253879507130e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2873809527527313e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4382, - "real_time": 1.5937113303198389e+05, - "cpu_time": 4.2094609356457496e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2897300158792348e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5940156769121045e+05, - "cpu_time": 4.2062761811958347e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2891022841508284e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time_median", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5937876244306620e+05, - "cpu_time": 4.2048281857602904e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2895725375411158e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.0488368574764749e+01, - "cpu_time": 3.0818342416845314e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2479751618041121e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.7947160401798319e-04, - "cpu_time": 7.3267519985061285e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.7942728866101864e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2795, - "real_time": 2.4803616338716034e+05, - "cpu_time": 5.6801190983903664e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2275125759112582e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2795, - "real_time": 2.5000300675743859e+05, - "cpu_time": 5.6804632450801879e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1942535555876894e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2795, - "real_time": 2.4790781402663860e+05, - "cpu_time": 5.6740105509836506e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2297012868151326e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2795, - "real_time": 2.4997883955098368e+05, - "cpu_time": 5.6803260250450938e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1946590434753213e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2795, - "real_time": 2.4790672274233110e+05, - "cpu_time": 5.6795278926655231e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2297199059416685e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4876650929291049e+05, - "cpu_time": 5.6788893624329648e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2151692735462136e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time_median", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4803616338716037e+05, - "cpu_time": 5.6801190983903664e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2275125759112582e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1190024853976104e+03, - "cpu_time": 2.7506307721743053e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8930096548503920e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.4982039124890376e-03, - "cpu_time": 4.8436069037905555e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4909457533073320e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1634, - "real_time": 4.2859671814888692e+05, - "cpu_time": 8.5595565055083891e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8930659316702614e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1634, - "real_time": 4.2855372299246991e+05, - "cpu_time": 8.5619150795598514e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8935568342661419e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1634, - "real_time": 4.2837991409765778e+05, - "cpu_time": 8.5590475459001353e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8955423234944487e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1634, - "real_time": 4.2842956163451378e+05, - "cpu_time": 8.5586376866574702e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8949750152606087e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1634, - "real_time": 4.2864860928115284e+05, - "cpu_time": 8.5628269155453367e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8924735893041649e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2852170523093629e+05, - "cpu_time": 8.5603967466342391e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8939227387991247e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time_median", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2855372299246991e+05, - "cpu_time": 8.5595565055083891e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8935568342661419e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1330476641351727e+02, - "cpu_time": 1.8595493738310603e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2940613569379158e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6440846526655108e-04, - "cpu_time": 2.1722700814798040e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6442210594756013e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 864, - "real_time": 8.0888867631545977e+05, - "cpu_time": 1.4787291909720404e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1852672967376995e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 864, - "real_time": 8.0864498300393776e+05, - "cpu_time": 1.4779259212963430e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1868299292714157e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 864, - "real_time": 8.0833682356266456e+05, - "cpu_time": 1.4780234525462505e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1888072864403477e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 864, - "real_time": 8.0829071339394432e+05, - "cpu_time": 1.4776796296297756e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1891032898157053e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 864, - "real_time": 8.0837867062655289e+05, - "cpu_time": 1.4776208807868822e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1885386792171383e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0850797338051186e+05, - "cpu_time": 1.4779958150462583e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1877092962964621e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time_median", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0837867062655278e+05, - "cpu_time": 1.4779259212963430e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1885386792171383e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5343624672296943e+02, - "cpu_time": 4.4272963897675919e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6258324400749297e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.1346165414214601e-04, - "cpu_time": 2.9954728861184400e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1340083786800114e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 443, - "real_time": 1.5709607795713381e+06, - "cpu_time": 2.7251961331827510e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3397946715696917e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 443, - "real_time": 1.5747354591357822e+06, - "cpu_time": 2.7259582460496230e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3269950526189861e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 443, - "real_time": 1.5709362256616084e+06, - "cpu_time": 2.7251506636572401e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3398781331604290e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 443, - "real_time": 1.5746252892463224e+06, - "cpu_time": 2.7260212279905695e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3273677599926767e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 443, - "real_time": 1.5714530592351209e+06, - "cpu_time": 2.7263531422118405e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3381219061567240e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5725421625700346e+06, - "cpu_time": 2.7257358826184049e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3344315046997023e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time_median", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5714530592351211e+06, - "cpu_time": 2.7259582460496230e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3381219061567240e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.9631555078462566e+03, - "cpu_time": 5.3518398136299697e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.6566825853844043e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2483961031848172e-03, - "cpu_time": 1.9634476868275546e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2478710392137911e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 217, - "real_time": 3.2241002426907625e+06, - "cpu_time": 5.3961073179721627e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2036893201552896e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 217, - "real_time": 3.2250085869194586e+06, - "cpu_time": 5.3971967327183234e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2022236678835220e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 217, - "real_time": 3.2232146879683854e+06, - "cpu_time": 5.3946867281102901e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2051189958354263e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 217, - "real_time": 3.2211390650114431e+06, - "cpu_time": 5.3926539723503627e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2084730467668896e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 217, - "real_time": 3.2235110674293772e+06, - "cpu_time": 5.3953291290322701e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2046404212842264e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2233947300038859e+06, - "cpu_time": 5.3951947760366816e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2048290903850708e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time_median", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2235110674293772e+06, - "cpu_time": 5.3953291290322701e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2046404212842264e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4349439338259269e+03, - "cpu_time": 1.7009122650328743e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3176152565600700e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.4516544017064800e-04, - "cpu_time": 3.1526429269757836e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4528172132326539e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 105, - "real_time": 6.7514337599277496e+06, - "cpu_time": 1.0892355571429236e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9699712969351683e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 105, - "real_time": 6.7571068670423254e+06, - "cpu_time": 1.0894403314285316e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9657986265780659e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 105, - "real_time": 6.7529575367059028e+06, - "cpu_time": 1.0886024171430195e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9688498435854044e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 105, - "real_time": 6.7508973536037263e+06, - "cpu_time": 1.0889326457143918e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9703661961454887e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 105, - "real_time": 6.7501735474382127e+06, - "cpu_time": 1.0884577923811127e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9708991575089779e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7525138129435834e+06, - "cpu_time": 1.0889337487619959e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9691770241506214e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time_median", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.7514337599277496e+06, - "cpu_time": 1.0889326457143916e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9699712969351683e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7635726262265498e+03, - "cpu_time": 4.1353072167589817e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0329387513449588e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.0926574943529688e-04, - "cpu_time": 3.7975746655481978e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0910974623457853e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 51, - "real_time": 1.3995977009043975e+07, - "cpu_time": 2.2732559588237066e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7948681222207880e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 51, - "real_time": 1.4020977943551308e+07, - "cpu_time": 2.2811074921567827e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7863183488470926e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 51, - "real_time": 1.3970916342063278e+07, - "cpu_time": 2.2718445294119600e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.8034690321600704e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 51, - "real_time": 1.4011377925235851e+07, - "cpu_time": 2.2773468882352222e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7895977367886438e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 51, - "real_time": 1.4022938779317865e+07, - "cpu_time": 2.2796713431373563e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7856490751408997e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4004437599842453e+07, - "cpu_time": 2.2766452423530061e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7919804630314989e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time_median", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4011377925235853e+07, - "cpu_time": 2.2773468882352225e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7895977367886438e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1559806635222329e+04, - "cpu_time": 4.0029786969434666e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3849372073484827e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5394982113001716e-03, - "cpu_time": 1.7582795169291394e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5411033630710234e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 31, - "real_time": 2.2710633013517626e+07, - "cpu_time": 4.2304367645160265e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.9099069550422525e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 31, - "real_time": 2.2522440300353114e+07, - "cpu_time": 4.2087731354836099e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.9592888785632925e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 31, - "real_time": 2.2675262043072332e+07, - "cpu_time": 4.2273408967745245e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.9191257743813257e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 31, - "real_time": 2.2639406424376272e+07, - "cpu_time": 4.2275796645159766e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.9285003097733717e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 31, - "real_time": 2.2703696102384597e+07, - "cpu_time": 4.2306490645160012e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.9117126742153206e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2650287576740790e+07, - "cpu_time": 4.2249559051612273e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.9257069183951130e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time_median", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2675262043072332e+07, - "cpu_time": 4.2275796645159766e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.9191257743813257e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6780680962959683e+04, - "cpu_time": 9.1775025915832972e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0151552376640368e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.3898325000431572e-03, - "cpu_time": 2.1722126331240551e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.4007001450044897e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 15, - "real_time": 4.8211543510357536e+07, - "cpu_time": 7.8690364466668442e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.5678668728440647e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 15, - "real_time": 4.8127627372741699e+07, - "cpu_time": 7.8660490400003865e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.5775750988305569e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 15, - "real_time": 4.8118165632088982e+07, - "cpu_time": 7.8600270133332148e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.5786718482257795e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 15, - "real_time": 4.8187468945980072e+07, - "cpu_time": 7.8680159333331779e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.5706485912535896e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 15, - "real_time": 4.8188418149948120e+07, - "cpu_time": 7.8607838399996892e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.5705388619462080e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8166644722223282e+07, - "cpu_time": 7.8647824546666607e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.5730602546200409e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time_median", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.8187468945980072e+07, - "cpu_time": 7.8660490400003865e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.5706485912535896e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1219556538068005e+04, - "cpu_time": 4.1460587354484363e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.7701822946801521e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.5576972977422254e-04, - "cpu_time": 5.2716763106248703e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5593589100812128e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8, - "real_time": 9.5696569420397282e+07, - "cpu_time": 1.5219337737499928e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6101374924059553e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8, - "real_time": 9.5662770792841911e+07, - "cpu_time": 1.5229740637499845e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6121196109048100e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8, - "real_time": 9.5471829175949097e+07, - "cpu_time": 1.5184150625000826e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6233437301235504e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8, - "real_time": 9.5622089691460133e+07, - "cpu_time": 1.5228369062501201e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6145072099166555e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8, - "real_time": 9.5692129805684090e+07, - "cpu_time": 1.5230681137498435e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6103977734656916e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5629077777266502e+07, - "cpu_time": 1.5218455840000048e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6141011633633327e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time_median", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.5662770792841911e+07, - "cpu_time": 1.5228369062501201e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.6121196109048100e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2792585138439084e+04, - "cpu_time": 1.9702170268881929e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.4530323772081165e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.7033859674529115e-04, - "cpu_time": 1.2946234805962984e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.7130996013995545e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.8888075649738312e+08, - "cpu_time": 2.8117600350003612e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6847602895686007e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.8893163651227951e+08, - "cpu_time": 2.8123227124996221e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6832293618025837e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.8859283998608589e+08, - "cpu_time": 2.8124326925001240e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6934389666077414e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.8940332159399986e+08, - "cpu_time": 2.8218334275004506e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6690759959407978e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.8916628137230873e+08, - "cpu_time": 2.8198113575001574e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6761797938328590e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time_mean", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8899496719241142e+08, - "cpu_time": 2.8156320450001431e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6813368815505171e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time_median", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8893163651227951e+08, - "cpu_time": 2.8124326925001240e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 5.6832293618025837e+09, - "hip_id": 4.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time_stddev", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.0613028822608985e+05, - "cpu_time": 4.7985361660058907e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.2017190833539367e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time_cv", - "family_index": 4, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/4/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6197801072365364e-03, - "cpu_time": 1.7042483141669338e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6196397564867968e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9430, - "real_time": 7.4131403252224889e+04, - "cpu_time": 2.7463859268294362e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3813309273479413e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9430, - "real_time": 7.4016262266150618e+04, - "cpu_time": 2.7429431187696807e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3834797497850677e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9430, - "real_time": 7.4198814377630391e+04, - "cpu_time": 2.7451275143159245e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3800759602281699e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9430, - "real_time": 7.4321437334310467e+04, - "cpu_time": 2.7501147433721949e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3777989725815902e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9430, - "real_time": 7.4104255385124576e+04, - "cpu_time": 2.7479711834569043e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3818369737044200e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4154434523088188e+04, - "cpu_time": 2.7465084973488282e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3809045167294377e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time_median", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4131403252224889e+04, - "cpu_time": 2.7463859268294368e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.3813309273479413e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1401695965027140e+02, - "cpu_time": 2.7284850701886791e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1221473587169614e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5375609076321913e-03, - "cpu_time": 9.9343769473950400e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5367806629694415e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9563, - "real_time": 7.4206926370552144e+04, - "cpu_time": 2.7463953529228334e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7598501921145692e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9563, - "real_time": 7.4412321954262981e+04, - "cpu_time": 2.7473657858412626e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7522323537475269e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9563, - "real_time": 7.4181377112826827e+04, - "cpu_time": 2.7477813792742859e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7608007288474519e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9563, - "real_time": 7.4051294075431273e+04, - "cpu_time": 2.7461979838963045e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7656505204538818e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9563, - "real_time": 7.4423664940886709e+04, - "cpu_time": 2.7518980968316080e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7518128832095101e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4255116890791993e+04, - "cpu_time": 2.7479277197532589e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7580693356745884e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time_median", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4206926370552130e+04, - "cpu_time": 2.7473657858412631e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.7598501921145692e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6001991932352402e+02, - "cpu_time": 2.3152329059347227e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.9439018424348156e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1550019180343826e-03, - "cpu_time": 8.4253777466265062e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1550951477371087e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9532, - "real_time": 7.4466443511040066e+04, - "cpu_time": 2.7550964393620490e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.5004641109156035e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9532, - "real_time": 7.4380819315156579e+04, - "cpu_time": 2.7510800451111922e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.5067960231050558e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9532, - "real_time": 7.4127892222387076e+04, - "cpu_time": 2.7481128902643564e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.5255854135334268e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9532, - "real_time": 7.4118660248141998e+04, - "cpu_time": 2.7492183508183016e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.5262736621074833e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9532, - "real_time": 7.4314580998459729e+04, - "cpu_time": 2.7497692719262087e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.5117043586438246e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4281679259037090e+04, - "cpu_time": 2.7506553994964215e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.5141647136610799e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time_median", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.4314580998459729e+04, - "cpu_time": 2.7497692719262082e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.5117043586438246e+07, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5433304454305281e+02, - "cpu_time": 2.7026765971710120e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1457710077716227e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0776730693561518e-03, - "cpu_time": 9.8255731985395431e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0778686660067112e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9396, - "real_time": 7.5050474547883350e+04, - "cpu_time": 2.7712085057470755e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0915320721620993e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9396, - "real_time": 7.5382501606558581e+04, - "cpu_time": 2.7745953724988160e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0867243492072256e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9396, - "real_time": 7.5208277193125527e+04, - "cpu_time": 2.7712975287357101e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0892418103081873e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9396, - "real_time": 7.5023742365215599e+04, - "cpu_time": 2.7715121062153857e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0919210028368542e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9396, - "real_time": 7.5000819605558849e+04, - "cpu_time": 2.7694269082588016e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0922547304260169e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5133163063668384e+04, - "cpu_time": 2.7716080842911580e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0903347929880768e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time_median", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.5050474547883350e+04, - "cpu_time": 2.7712975287357101e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0915320721620993e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6135125674404975e+02, - "cpu_time": 1.8672666707624040e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3380341262479467e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.1475371216212410e-03, - "cpu_time": 6.7371237706573489e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.1443268079527514e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9030, - "real_time": 7.6710085437179543e+04, - "cpu_time": 2.8000450808417075e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1358338876336417e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9030, - "real_time": 7.6666321751092022e+04, - "cpu_time": 2.8001684330009919e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1370530926464629e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9030, - "real_time": 7.6618353717760343e+04, - "cpu_time": 2.7983959999999712e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1383910257787418e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9030, - "real_time": 7.6438806939797665e+04, - "cpu_time": 2.7972008781839418e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1434138830690873e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9030, - "real_time": 7.6476338989770971e+04, - "cpu_time": 2.7979721395348397e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1423619666458446e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6581981367120112e+04, - "cpu_time": 2.7987565063122904e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1394107711547557e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time_median", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.6618353717760328e+04, - "cpu_time": 2.7983959999999718e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.1383910257787418e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1885508987269618e+02, - "cpu_time": 1.3056737918903093e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3214110003129696e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5519981038741536e-03, - "cpu_time": 4.6651925201263633e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5524886782355613e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8952, - "real_time": 7.8926509139704634e+04, - "cpu_time": 2.8436951988383784e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1517102881110173e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8952, - "real_time": 7.8889710743489646e+04, - "cpu_time": 2.8431595844503382e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1536468686702812e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8952, - "real_time": 7.8910225784707043e+04, - "cpu_time": 2.8441343621537549e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1525670056250817e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8952, - "real_time": 7.8954211893166910e+04, - "cpu_time": 2.8423951407505921e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1502535728351569e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8952, - "real_time": 7.8908012524880003e+04, - "cpu_time": 2.8434721235479729e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1526834793447775e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8917734017189665e+04, - "cpu_time": 2.8433712819482078e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1521722429172635e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time_median", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.8910225784707029e+04, - "cpu_time": 2.8434721235479729e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 4.1525670056250817e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4206523118148258e+01, - "cpu_time": 6.5097043549226115e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2734224059596250e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0673109687710565e-04, - "cpu_time": 2.2894317025184003e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0668824207180157e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8219, - "real_time": 8.4251423352324040e+04, - "cpu_time": 2.9357600365009438e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7786222941232026e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8219, - "real_time": 8.4223953132370734e+04, - "cpu_time": 2.9359273695096275e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7811593451331151e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8219, - "real_time": 8.4332350544549437e+04, - "cpu_time": 2.9307992079327034e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7711577558104384e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8219, - "real_time": 8.4207001008062027e+04, - "cpu_time": 2.9361029018127837e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7827258084782696e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8219, - "real_time": 8.4353974868516190e+04, - "cpu_time": 2.9366995279231516e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7691656027059722e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4273740581164486e+04, - "cpu_time": 2.9350578087358421e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7765661612502003e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time_median", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4251423352324040e+04, - "cpu_time": 2.9359273695096275e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.7786222941232026e+08, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.5771741762524357e+01, - "cpu_time": 2.4068860591617130e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.0680596305573662e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.8045357081520832e-04, - "cpu_time": 8.2004724131767013e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8030065002132436e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7336, - "real_time": 9.5096494603131883e+04, - "cpu_time": 3.0920485305344150e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3783052734699152e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7336, - "real_time": 9.2613309000664725e+04, - "cpu_time": 3.0908862009270990e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4152609534668419e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7336, - "real_time": 9.4887698607651560e+04, - "cpu_time": 3.0895154048527300e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3813381705247788e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7336, - "real_time": 9.2536850662310346e+04, - "cpu_time": 3.0899279021262529e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4164303092431130e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7336, - "real_time": 9.2436062684101751e+04, - "cpu_time": 3.0885320651584107e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4179747188922977e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.3514083111572065e+04, - "cpu_time": 3.0901820207197819e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4018618851193895e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time_median", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.2613309000664711e+04, - "cpu_time": 3.0899279021262529e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.4152609534668419e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3527149515417300e+03, - "cpu_time": 1.3426685159138907e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0171354933322649e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4465360794136217e-02, - "cpu_time": 4.3449496078588575e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4388974511283440e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6095, - "real_time": 1.1387341791879266e+05, - "cpu_time": 3.4364054126331903e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3020649137531338e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6095, - "real_time": 1.1354598417956270e+05, - "cpu_time": 3.4339715668579348e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3087034023628960e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6095, - "real_time": 1.1358365629827550e+05, - "cpu_time": 3.4351716833470378e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3079376782131290e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6095, - "real_time": 1.1355246969122802e+05, - "cpu_time": 3.4335596242824115e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3085715415333738e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6095, - "real_time": 1.1354404303166554e+05, - "cpu_time": 3.4339803494666400e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3087428719346590e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1361991422390488e+05, - "cpu_time": 3.4346177273174434e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3072040815594382e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time_median", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1355246969122805e+05, - "cpu_time": 3.4339803494666406e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.3085715415333738e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4260926929560898e+02, - "cpu_time": 1.1668378169410953e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.8911500854573427e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.2551432578498192e-03, - "cpu_time": 3.3972858395872678e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2530968146966938e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4453, - "real_time": 1.5757481509510826e+05, - "cpu_time": 4.1631037031216943e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3272322082913618e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4453, - "real_time": 1.5778575909944941e+05, - "cpu_time": 4.1655520480573660e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3227840268496671e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4453, - "real_time": 1.5771968512021087e+05, - "cpu_time": 4.1638064024250832e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3241760506965117e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4453, - "real_time": 1.5790224385740812e+05, - "cpu_time": 4.1655514731639886e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3203328033352871e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4453, - "real_time": 1.5782212409378123e+05, - "cpu_time": 4.1630090545698005e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3220183989442253e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5776092545319159e+05, - "cpu_time": 4.1642045362675871e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3233086976234112e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time_median", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5778575909944944e+05, - "cpu_time": 4.1638064024250838e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.3227840268496671e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2315712058746423e+02, - "cpu_time": 1.2678276403541035e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5953002826493895e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.8065668183472682e-04, - "cpu_time": 3.0445854167635787e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.8093867250591544e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2814, - "real_time": 2.4633521223270320e+05, - "cpu_time": 5.6399166524518305e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2567036620385857e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2814, - "real_time": 2.4889705826110698e+05, - "cpu_time": 5.6397573240938841e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2128902901696205e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2814, - "real_time": 2.4638320194623835e+05, - "cpu_time": 5.6402503269363823e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2558745552336922e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2814, - "real_time": 2.4898495845346563e+05, - "cpu_time": 5.6398932444919285e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2114029960407224e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2814, - "real_time": 2.4638024256036794e+05, - "cpu_time": 5.6399666204688931e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2559256744910398e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4739613469077647e+05, - "cpu_time": 5.6399568336885830e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2385594355947323e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time_median", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4638320194623829e+05, - "cpu_time": 5.6399166524518305e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2558745552336922e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4107408107458155e+03, - "cpu_time": 1.8144990595823618e+01, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4119441384761795e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.7023559099220293e-03, - "cpu_time": 3.2172215374841140e-05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.6904808700358554e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1641, - "real_time": 4.2646883163682884e+05, - "cpu_time": 8.5071650517970289e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9174801167788200e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1641, - "real_time": 4.2654829202852643e+05, - "cpu_time": 8.5110001645326242e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9165640542753553e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1641, - "real_time": 4.2668645110408089e+05, - "cpu_time": 8.5118111395495990e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9149720938489456e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1641, - "real_time": 4.2647769413451455e+05, - "cpu_time": 8.5044867885425966e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9173779281843081e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1641, - "real_time": 4.2653620131126518e+05, - "cpu_time": 8.5058697014019347e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9167034206074381e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2654349404304323e+05, - "cpu_time": 8.5080665691647562e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9166195227389736e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time_median", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2653620131126512e+05, - "cpu_time": 8.5071650517970289e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.9167034206074381e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.7202391589604389e+01, - "cpu_time": 3.2047456999868132e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.0049799100081554e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.0443962411205983e-04, - "cpu_time": 3.7667144161771947e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0440465351451406e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 861, - "real_time": 8.0671936622955999e+05, - "cpu_time": 1.4729545447152157e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1992107485944118e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 861, - "real_time": 8.0610110608884657e+05, - "cpu_time": 1.4716147247388437e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2031984180626020e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 861, - "real_time": 8.0602696088643512e+05, - "cpu_time": 1.4716997607431312e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2036770524242487e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 861, - "real_time": 8.0598533578361978e+05, - "cpu_time": 1.4713986202092627e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2039457962620192e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 861, - "real_time": 8.0648857008224470e+05, - "cpu_time": 1.4723444761904667e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2006986280937243e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0626426781414135e+05, - "cpu_time": 1.4720024253193843e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2021461286874008e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time_median", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0610110608884646e+05, - "cpu_time": 1.4716997607431314e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.2031984180626020e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2332857867871633e+02, - "cpu_time": 6.3836281566756747e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.0857587394902604e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.0102059781874083e-04, - "cpu_time": 4.3366967654897729e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.0094197431100160e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 445, - "real_time": 1.5769819344467157e+06, - "cpu_time": 2.7269252696631034e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3194065301345024e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 445, - "real_time": 1.5708137863430749e+06, - "cpu_time": 2.7250570494380668e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3402943575693054e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 445, - "real_time": 1.5731077366560865e+06, - "cpu_time": 2.7258024044942758e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3325069888928537e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 445, - "real_time": 1.5669014736528643e+06, - "cpu_time": 2.7239281887641787e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3536282536284313e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 445, - "real_time": 1.5732418583559522e+06, - "cpu_time": 2.7198846044944385e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3320523830748758e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5722093578909389e+06, - "cpu_time": 2.7243195033708126e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3355777026599932e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time_median", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5731077366560865e+06, - "cpu_time": 2.7250570494380668e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3325069888928537e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.7004014521036343e+03, - "cpu_time": 2.7089870375182604e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.2564167361024765e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.3536314890451908e-03, - "cpu_time": 9.9437200158293418e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.3547904390486224e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 218, - "real_time": 3.2158928854954899e+06, - "cpu_time": 5.3858120871555340e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2169697802030630e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 218, - "real_time": 3.2145218216651762e+06, - "cpu_time": 5.3835729908254035e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2191949318636513e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 218, - "real_time": 3.2168961377865677e+06, - "cpu_time": 5.3858436788983168e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2153427656336479e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 218, - "real_time": 3.2150304391382076e+06, - "cpu_time": 5.3835729908254035e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2183692557813396e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 218, - "real_time": 3.2169629484329610e+06, - "cpu_time": 5.3856977110094829e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2152344521631727e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2158608465036806e+06, - "cpu_time": 5.3848998917428283e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2170222371289759e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time_median", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2158928854954904e+06, - "cpu_time": 5.3856977110094829e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.2169697802030630e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.0920218749542132e+03, - "cpu_time": 1.2125059091588769e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7716244607929753e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.3957373377690498e-04, - "cpu_time": 2.2516777164569495e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3958537653616233e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 101, - "real_time": 6.8330636321760640e+06, - "cpu_time": 1.1052080960395627e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9105984966971874e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 101, - "real_time": 6.8273620892057912e+06, - "cpu_time": 1.1073970524752315e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.9146993467726412e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 101, - "real_time": 6.8526232504461072e+06, - "cpu_time": 1.1127624811882079e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.8965820494823790e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 101, - "real_time": 6.9800810750094382e+06, - "cpu_time": 1.1460912861386785e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.8071693780368633e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 101, - "real_time": 6.8491604547984526e+06, - "cpu_time": 1.1059517277227305e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.8990576613652115e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8684581003271714e+06, - "cpu_time": 1.1154821287128823e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.8856213864708576e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time_median", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.8491604547984526e+06, - "cpu_time": 1.1073970524752315e+07, - "time_unit": "ns", - "bytes": 3.3554432000000000e+07, - "bytes_per_second": 4.8990576613652115e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 6.3293918697629975e+04, - "cpu_time": 1.7364257464322346e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.4510591589393191e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 15, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):25/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.2151568478833767e-03, - "cpu_time": 1.5566594046969076e-02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1105282354974997e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 50, - "real_time": 1.4167133942246437e+07, - "cpu_time": 2.3148798780002836e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7369400383715696e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 50, - "real_time": 1.4230987522751093e+07, - "cpu_time": 2.3347207500000879e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7156856748495493e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 50, - "real_time": 1.4181377310305834e+07, - "cpu_time": 2.3206355120000806e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7321823918492680e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 50, - "real_time": 1.4205118399113417e+07, - "cpu_time": 2.3280875899999958e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7242734706236916e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 50, - "real_time": 1.4167889207601547e+07, - "cpu_time": 2.3201921620002393e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7366875203960409e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4190501276403666e+07, - "cpu_time": 2.3237031784001373e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7291538192180243e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time_median", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4181377310305834e+07, - "cpu_time": 2.3206355120000809e+07, - "time_unit": "ns", - "bytes": 6.7108864000000000e+07, - "bytes_per_second": 4.7321823918492680e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.7355900359201274e+04, - "cpu_time": 7.7491675728313392e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.1071788913318273e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 16, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):26/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9277613825164422e-03, - "cpu_time": 3.3348353803804740e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9257523099212111e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 26, - "real_time": 2.6665634618928798e+07, - "cpu_time": 4.3360272192304499e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0333596000270901e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 26, - "real_time": 2.6682865662643544e+07, - "cpu_time": 4.3301535884622283e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0301091980501575e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 26, - "real_time": 2.6750324795452449e+07, - "cpu_time": 4.3197325461540885e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0174242378850288e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 26, - "real_time": 2.6626219041645527e+07, - "cpu_time": 4.3230002115382589e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0408106306822157e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 26, - "real_time": 2.6693887292192534e+07, - "cpu_time": 4.3298398846157119e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0280323180676727e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6683786282172572e+07, - "cpu_time": 4.3277506900001481e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0299471969424334e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time_median", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.6682865662643544e+07, - "cpu_time": 4.3298398846157119e+07, - "time_unit": "ns", - "bytes": 1.3421772800000000e+08, - "bytes_per_second": 5.0301091980501575e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5204318801594767e+04, - "cpu_time": 6.4322870660360939e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.5172794427516591e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 17, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):27/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.6940743837315080e-03, - "cpu_time": 1.4862887275135235e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.6933138876545422e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 10, - "real_time": 5.0896696001291275e+07, - "cpu_time": 8.0828112199992567e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2741234125136461e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 10, - "real_time": 5.0996154174208641e+07, - "cpu_time": 8.0783675900011078e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2638372510012045e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 10, - "real_time": 5.0961642712354660e+07, - "cpu_time": 8.0795241500004515e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2674019461096182e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 10, - "real_time": 5.0911192595958710e+07, - "cpu_time": 8.0835311700002417e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2726216439350939e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 10, - "real_time": 5.0969769805669785e+07, - "cpu_time": 8.0766976499990046e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2665620626393280e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0947091057896622e+07, - "cpu_time": 8.0801863560000136e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2689092632397785e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time_median", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 5.0961642712354660e+07, - "cpu_time": 8.0795241500004515e+07, - "time_unit": "ns", - "bytes": 2.6843545600000000e+08, - "bytes_per_second": 5.2674019461096182e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.1718182261840018e+04, - "cpu_time": 2.9152696200963117e+04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.3149677517033657e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 18, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):28/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 8.1885307670326432e-04, - "cpu_time": 3.6079237429116379e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 8.1894895814739325e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 9, - "real_time": 9.9134230779276952e+07, - "cpu_time": 1.5704988599999422e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4155956805207558e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 9, - "real_time": 9.9137485855155528e+07, - "cpu_time": 1.5687742355554393e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4154178650888262e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 9, - "real_time": 9.9097324742211238e+07, - "cpu_time": 1.5689588044445676e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4176125682161417e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 9, - "real_time": 9.9218212068080902e+07, - "cpu_time": 1.5729261344444644e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4110117569102478e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 9, - "real_time": 9.9172240330113307e+07, - "cpu_time": 1.5699797088889986e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4135200557426653e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.9151898754967600e+07, - "cpu_time": 1.5702275486666825e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4146315852957268e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time_median", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.9137485855155528e+07, - "cpu_time": 1.5699797088889986e+08, - "time_unit": "ns", - "bytes": 5.3687091200000000e+08, - "bytes_per_second": 5.4154178650888262e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.5578084338534863e+04, - "cpu_time": 1.6687742877715878e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4886055453446214e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 19, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):29/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 4.5967939001522514e-04, - "cpu_time": 1.0627595275529229e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 4.5960754783443001e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4, - "real_time": 1.6420438885688782e+08, - "cpu_time": 2.8615045775001138e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.5390567905941830e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4, - "real_time": 1.6459254920482635e+08, - "cpu_time": 2.8654213499999058e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.5236356638707104e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4, - "real_time": 1.6448822245001793e+08, - "cpu_time": 2.8634273350002104e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.5277732837454157e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4, - "real_time": 1.6477622836828232e+08, - "cpu_time": 2.8654359000000793e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.5163636443974094e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4, - "real_time": 1.6497995704412460e+08, - "cpu_time": 2.8666079749996245e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.5083167873102493e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time_mean", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6460826918482783e+08, - "cpu_time": 2.8644794274999869e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.5230292339835939e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time_median", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6459254920482635e+08, - "cpu_time": 2.8654213499999058e+08, - "time_unit": "ns", - "bytes": 1.0737418240000000e+09, - "bytes_per_second": 6.5236356638707104e+09, - "hip_id": 5.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time_stddev", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.9331715242342890e+05, - "cpu_time": 2.0180066428868429e+05, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.1625860267716967e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time_cv", - "family_index": 5, - "per_family_instance_index": 20, - "run_name": "Comm_prefetch_managed_HostToGPU/0/5/log2(N):30/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.7819101912436872e-03, - "cpu_time": 7.0449332730871989e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.7822793445641343e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8815, - "real_time": 7.9930999779130027e+04, - "cpu_time": 2.8269975757231913e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.2811049565620050e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8815, - "real_time": 7.9806262154253098e+04, - "cpu_time": 2.8244717742486118e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.2831073306262197e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8815, - "real_time": 7.9752029241268727e+04, - "cpu_time": 2.8215825263756234e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.2839798682766531e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8815, - "real_time": 7.9511089906445384e+04, - "cpu_time": 2.8187596324449137e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.2878706620735077e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8815, - "real_time": 7.9709553930768976e+04, - "cpu_time": 2.8244491117413028e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.2846640703690125e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9741987002373236e+04, - "cpu_time": 2.8232521241067292e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.2841453775814796e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time_median", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9752029241268727e+04, - "cpu_time": 2.8244491117413028e+05, - "time_unit": "ns", - "bytes": 1.0240000000000000e+03, - "bytes_per_second": 1.2839798682766531e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5356052921528433e+02, - "cpu_time": 3.1590651935910068e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4746657118784500e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 0, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):10/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9257173665701874e-03, - "cpu_time": 1.1189454766072401e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9270915544929658e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8764, - "real_time": 7.9846212602500644e+04, - "cpu_time": 2.8253962311730004e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5649306751662508e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8764, - "real_time": 7.9988776974615714e+04, - "cpu_time": 2.8258438064810238e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5603591872018855e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8764, - "real_time": 7.9533820542063637e+04, - "cpu_time": 2.8188770880877739e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5750051814961653e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8764, - "real_time": 7.9662512288961676e+04, - "cpu_time": 2.8194851962573238e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5708453589452997e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8764, - "real_time": 7.9632535710543918e+04, - "cpu_time": 2.8184110429026902e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5718131185025550e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9732771623737121e+04, - "cpu_time": 2.8216026729803625e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5685907042624313e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time_median", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9662512288961661e+04, - "cpu_time": 2.8194851962573238e+05, - "time_unit": "ns", - "bytes": 2.0480000000000000e+03, - "bytes_per_second": 2.5708453589452997e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.8232713776204986e+02, - "cpu_time": 3.6904376557498006e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.8687014227222789e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 1, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):11/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.2867277036656974e-03, - "cpu_time": 1.3079225119430856e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.2847943087948969e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8742, - "real_time": 7.9963619629171721e+04, - "cpu_time": 2.8247176721572311e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.1223294030398399e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8742, - "real_time": 7.9819428825215247e+04, - "cpu_time": 2.8255865191031864e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.1315826989556946e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8742, - "real_time": 7.9708807280520879e+04, - "cpu_time": 2.8208547060170805e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.1387044164202094e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8742, - "real_time": 7.9857956347466912e+04, - "cpu_time": 2.8209020521621022e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.1291069635917693e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8742, - "real_time": 7.9581202082703763e+04, - "cpu_time": 2.8184642747653776e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.1469441184656695e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9786202833015719e+04, - "cpu_time": 2.8221050448409963e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.1337335200946368e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time_median", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 7.9819428825215247e+04, - "cpu_time": 2.8209020521621022e+05, - "time_unit": "ns", - "bytes": 4.0960000000000000e+03, - "bytes_per_second": 5.1315826989556946e+07, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4641092182750921e+02, - "cpu_time": 2.9669946844171665e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4248960475036540e+04, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 2, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):12/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.8350406038739825e-03, - "cpu_time": 1.0513409803228405e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.8358755885190380e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8702, - "real_time": 8.0655506665299486e+04, - "cpu_time": 2.8466959032406844e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0156777061725971e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8702, - "real_time": 8.0639028112949934e+04, - "cpu_time": 2.8462781889222813e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0158852594956358e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8702, - "real_time": 8.0390973732844155e+04, - "cpu_time": 2.8464431831764837e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0190198749456267e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8702, - "real_time": 8.0433557406057938e+04, - "cpu_time": 2.8461363847391721e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0184803786116029e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8702, - "real_time": 8.0590637114350204e+04, - "cpu_time": 2.8503479050793458e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0164952522184874e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0541940606300341e+04, - "cpu_time": 2.8471803130315937e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0171116942887901e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time_median", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0590637114350189e+04, - "cpu_time": 2.8464431831764831e+05, - "time_unit": "ns", - "bytes": 8.1920000000000000e+03, - "bytes_per_second": 1.0164952522184874e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2168863809823263e+02, - "cpu_time": 1.7829236409310357e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5374422948520703e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 3, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):13/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5108729338055408e-03, - "cpu_time": 6.2620678879049692e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5115766571999929e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8522, - "real_time": 8.2181486635480047e+04, - "cpu_time": 2.8776045470546960e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.9936363615168005e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8522, - "real_time": 8.1975165204015459e+04, - "cpu_time": 2.8762507944145706e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.9986540995952088e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8522, - "real_time": 8.1913577035179900e+04, - "cpu_time": 2.8807644297112111e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 2.0001568229603097e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8522, - "real_time": 8.1941108311944161e+04, - "cpu_time": 2.8792168199952459e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.9994847931061950e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8522, - "real_time": 8.2162971297303360e+04, - "cpu_time": 2.8811910971602425e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.9940856253500330e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2034861696784588e+04, - "cpu_time": 2.8790055376671941e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.9972035405057096e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time_median", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.1975165204015459e+04, - "cpu_time": 2.8792168199952459e+05, - "time_unit": "ns", - "bytes": 1.6384000000000000e+04, - "bytes_per_second": 1.9986540995952088e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2745026476088799e+02, - "cpu_time": 2.0896409272722877e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.1014622844716330e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 4, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):14/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.5536110151799462e-03, - "cpu_time": 7.2582039177510082e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.5529024566451125e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 8292, - "real_time": 8.4780401214261714e+04, - "cpu_time": 2.9190081922332977e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8650442237454027e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 8292, - "real_time": 8.4494668256846169e+04, - "cpu_time": 2.9152442486735247e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8781145220183730e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 8292, - "real_time": 8.4333878750819902e+04, - "cpu_time": 2.9136380559576669e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8855084676964921e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 8292, - "real_time": 8.4498803303244829e+04, - "cpu_time": 2.9167102243126149e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8779247420113081e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 8292, - "real_time": 8.4504815994216202e+04, - "cpu_time": 2.9161467836469732e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8776488197125661e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4522513503877781e+04, - "cpu_time": 2.9161495009648160e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8768481550368291e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time_median", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4498803303244844e+04, - "cpu_time": 2.9161467836469726e+05, - "time_unit": "ns", - "bytes": 3.2768000000000000e+04, - "bytes_per_second": 3.8779247420113081e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6104337495492871e+02, - "cpu_time": 1.9756879531930340e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.3779671660966345e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 5, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):15/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.9053311156860032e-03, - "cpu_time": 6.7749885681079528e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9030838637595661e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7610, - "real_time": 8.9833033150855903e+04, - "cpu_time": 3.0071322299604717e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.2953119472149968e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7610, - "real_time": 8.9849870538069168e+04, - "cpu_time": 3.0062114835743693e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.2939448446097159e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7610, - "real_time": 8.9881791415663785e+04, - "cpu_time": 3.0074579724047327e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.2913544520852721e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7610, - "real_time": 8.9894737744082493e+04, - "cpu_time": 3.0102816281211487e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.2903043764999509e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7610, - "real_time": 9.0046208583801534e+04, - "cpu_time": 3.0118513823917328e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.2780410225721943e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9901128286494582e+04, - "cpu_time": 3.0085869392904907e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.2897913285964262e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time_median", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.9881791415663785e+04, - "cpu_time": 3.0074579724047321e+05, - "time_unit": "ns", - "bytes": 6.5536000000000000e+04, - "bytes_per_second": 7.2913544520852721e+08, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.4745723400643868e+01, - "cpu_time": 2.3749786483307057e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 6.8648596134225500e+05, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 6, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):16/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 9.4265472542878889e-04, - "cpu_time": 7.8940003937223496e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 9.4170865858574690e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 7015, - "real_time": 9.6781413510713290e+04, - "cpu_time": 3.1634006585888023e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3543096266670139e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 7015, - "real_time": 9.9664518699837892e+04, - "cpu_time": 3.1660107940127968e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3151320220062749e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 7015, - "real_time": 9.6821396517909539e+04, - "cpu_time": 3.1700416949392605e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3537503559531386e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 7015, - "real_time": 9.6993303981543926e+04, - "cpu_time": 3.1696348724162957e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3513510172304330e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 7015, - "real_time": 9.9368854012627067e+04, - "cpu_time": 3.1692280741268600e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3190451002216885e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.7925897344526340e+04, - "cpu_time": 3.1676632188168028e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3387176244157100e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time_median", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 9.6993303981543941e+04, - "cpu_time": 3.1692280741268600e+05, - "time_unit": "ns", - "bytes": 1.3107200000000000e+05, - "bytes_per_second": 1.3513510172304330e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4581172677206546e+03, - "cpu_time": 2.8676325670859353e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.9824133113903366e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 7, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):17/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4890006701604735e-02, - "cpu_time": 9.0528328581504437e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4808300684437250e-02, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 6002, - "real_time": 1.1694178033477906e+05, - "cpu_time": 3.5034565294903488e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2416624687048402e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 6002, - "real_time": 1.1664264220556423e+05, - "cpu_time": 3.5032668593799399e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2474113672597761e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 6002, - "real_time": 1.1764109574363998e+05, - "cpu_time": 3.5175805398197187e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2283369458854456e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 6002, - "real_time": 1.1686097558610521e+05, - "cpu_time": 3.5095460263242910e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2432124897575212e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 6002, - "real_time": 1.1678643826270479e+05, - "cpu_time": 3.5080245801399276e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2446441889966817e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1697458642655870e+05, - "cpu_time": 3.5083749070308456e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2410534921208529e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time_median", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.1686097558610523e+05, - "cpu_time": 3.5080245801399276e+05, - "time_unit": "ns", - "bytes": 2.6214400000000000e+05, - "bytes_per_second": 2.2432124897575212e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.8852446186801859e+02, - "cpu_time": 5.8420996400073261e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.4171819406780088e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 8, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):18/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.3214433471149712e-03, - "cpu_time": 1.6651868157817613e-03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.3096853630471147e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 4365, - "real_time": 1.6096995623125124e+05, - "cpu_time": 4.2273608911796176e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2570549950749941e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 4365, - "real_time": 1.6071479529196254e+05, - "cpu_time": 4.2251560137458134e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2622261008860583e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 4365, - "real_time": 1.6096850866739897e+05, - "cpu_time": 4.2296578235968074e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2570842852455668e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 4365, - "real_time": 1.6093775222276925e+05, - "cpu_time": 4.2283772348227981e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2577067391514397e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 4365, - "real_time": 1.6075271944996002e+05, - "cpu_time": 4.2258272760591353e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2614564891588235e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6086874637266845e+05, - "cpu_time": 4.2272758478808345e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2591057219033766e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time_median", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.6093775222276925e+05, - "cpu_time": 4.2273608911796176e+05, - "time_unit": "ns", - "bytes": 5.2428800000000000e+05, - "bytes_per_second": 3.2577067391514397e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.2462036378641309e+02, - "cpu_time": 1.8361747552012633e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5254559538269518e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 9, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):19/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 7.7467106940535006e-04, - "cpu_time": 4.3436359993440017e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.7489230768250134e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 2774, - "real_time": 2.4909939978964339e+05, - "cpu_time": 5.6966258327322640e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2094681917559395e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 2774, - "real_time": 2.5176030215674642e+05, - "cpu_time": 5.6982819718816655e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1649775243245244e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 2774, - "real_time": 2.4946549084026128e+05, - "cpu_time": 5.7029779235759575e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2032907897125874e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 2774, - "real_time": 2.5202579451642634e+05, - "cpu_time": 5.7021997152122424e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1605899983846965e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 2774, - "real_time": 2.4922767546794709e+05, - "cpu_time": 5.7004793763514922e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2073016089854598e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.5031573255420494e+05, - "cpu_time": 5.7001129639507248e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.1891256226326418e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time_median", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.4946549084026125e+05, - "cpu_time": 5.7004793763514911e+05, - "time_unit": "ns", - "bytes": 1.0485760000000000e+06, - "bytes_per_second": 4.2032907897125874e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.4489080233379000e+03, - "cpu_time": 2.6556260383540206e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.4198404182596836e+07, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 10, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):20/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 5.7883218467866156e-03, - "cpu_time": 4.6589007185454396e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 5.7764809085360950e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 1628, - "real_time": 4.2972306977483811e+05, - "cpu_time": 8.5732849508600484e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8802406654565783e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 1628, - "real_time": 4.2981112731108099e+05, - "cpu_time": 8.5759601289920707e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8792408263599024e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 1628, - "real_time": 4.2992425059281284e+05, - "cpu_time": 8.5757788943487697e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8779569822085733e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 1628, - "real_time": 4.3007275832234026e+05, - "cpu_time": 8.5797480159700860e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8762725827618713e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 1628, - "real_time": 4.2984229061296047e+05, - "cpu_time": 8.5743679606886755e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8788870843988733e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2987469932280655e+05, - "cpu_time": 8.5758279901719303e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8785196282371597e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time_median", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 4.2984229061296053e+05, - "cpu_time": 8.5757788943487708e+05, - "time_unit": "ns", - "bytes": 2.0971520000000000e+06, - "bytes_per_second": 4.8788870843988733e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.3206621497618215e+02, - "cpu_time": 2.4487347937683535e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4985746401164008e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 11, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):21/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 3.0722025554011368e-04, - "cpu_time": 2.8553916852980878e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 3.0717815122492534e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 862, - "real_time": 8.0926739671505254e+05, - "cpu_time": 1.4794024222736207e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1828406989152889e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 862, - "real_time": 8.0906637250651058e+05, - "cpu_time": 1.4785273979119295e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1841284504334631e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 862, - "real_time": 8.0898730583994568e+05, - "cpu_time": 1.4788674675174279e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1846351231002169e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 862, - "real_time": 8.0931807256124390e+05, - "cpu_time": 1.4787452412991626e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1825161728148642e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 862, - "real_time": 8.0880037922976131e+05, - "cpu_time": 1.4779192354988821e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1858333746014423e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0908790537050297e+05, - "cpu_time": 1.4786923529002047e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1839907639730549e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time_median", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.0906637250651070e+05, - "cpu_time": 1.4787452412991624e+06, - "time_unit": "ns", - "bytes": 4.1943040000000000e+06, - "bytes_per_second": 5.1841284504334631e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.1121629288721783e+02, - "cpu_time": 5.3911536081128065e+02, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3533697676540583e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 12, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):22/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.6105481429795479e-04, - "cpu_time": 3.6458926683018080e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.6106716413530493e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 443, - "real_time": 1.5805256337507651e+06, - "cpu_time": 2.7354371376979630e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3074798793948631e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 443, - "real_time": 1.5759599811878919e+06, - "cpu_time": 2.7326642099319901e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3228559735869827e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 443, - "real_time": 1.5801131624400481e+06, - "cpu_time": 2.7349041444694675e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3088653391419849e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 443, - "real_time": 1.5766975045746558e+06, - "cpu_time": 2.7338569074490028e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3203661296229343e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 443, - "real_time": 1.5805826796235570e+06, - "cpu_time": 2.7363224266365715e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3072883235680466e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5787757923153839e+06, - "cpu_time": 2.7346369652369996e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3133711290629625e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time_median", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 1.5801131624400481e+06, - "cpu_time": 2.7349041444694675e+06, - "time_unit": "ns", - "bytes": 8.3886080000000000e+06, - "bytes_per_second": 5.3088653391419849e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 2.2562921951934313e+03, - "cpu_time": 1.4188634957706295e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 7.5977265783706643e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 13, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):23/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 1.4291403543022553e-03, - "cpu_time": 5.1884894185494292e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.4299258218220038e-03, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 0, - "threads": 1, - "iterations": 216, - "real_time": 3.2298926757734823e+06, - "cpu_time": 5.4086677129629590e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1943571146624117e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 1, - "threads": 1, - "iterations": 216, - "real_time": 3.2288911601494034e+06, - "cpu_time": 5.4094870185184414e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1959682652244329e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 2, - "threads": 1, - "iterations": 216, - "real_time": 3.2304549423753526e+06, - "cpu_time": 5.4109335324070612e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1934530272890043e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 3, - "threads": 1, - "iterations": 216, - "real_time": 3.2310082600883176e+06, - "cpu_time": 5.4127214259256953e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1925636363249054e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "run_type": "iteration", - "repetitions": 5, - "repetition_index": 4, - "threads": 1, - "iterations": 216, - "real_time": 3.2306638205665406e+06, - "cpu_time": 5.4091271805555578e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1931172451913891e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time_mean", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "mean", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2301821717906194e+06, - "cpu_time": 5.4101873740739431e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1938918577384300e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time_median", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "median", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 3.2304549423753517e+06, - "cpu_time": 5.4094870185184404e+06, - "time_unit": "ns", - "bytes": 1.6777216000000000e+07, - "bytes_per_second": 5.1934530272890043e+09, - "hip_id": 6.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time_stddev", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "stddev", - "aggregate_unit": "time", - "iterations": 5, - "real_time": 8.2754610229075183e+02, - "cpu_time": 1.6509125605178856e+03, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 1.3308550706970312e+06, - "hip_id": 0.0000000000000000e+00, - "numa_id": 0.0000000000000000e+00 - }, - { - "name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time_cv", - "family_index": 6, - "per_family_instance_index": 14, - "run_name": "Comm_prefetch_managed_HostToGPU/0/6/log2(N):24/manual_time", - "run_type": "aggregate", - "repetitions": 5, - "threads": 1, - "aggregate_name": "cv", - "aggregate_unit": "percentage", - "iterations": 5, - "real_time": 2.5619177441995786e-04, - "cpu_time": 3.0514886941424485e-04, - "time_unit": "ns", - "bytes": 0.0000000000000000e+00, - "bytes_per_second": 2.5623465161566219e-04, - "hip_id": 0.0000000000000000e+00, - "numa_id": NaN - } \ No newline at end of file